{"id":"https://openalex.org/W6908585519","doi":"https://doi.org/10.26190/unsworks/30630","title":"Speech Based Continuous Emotion Recognition: Modelling of Ambiguity and Temporal Dynamics","display_name":"Speech Based Continuous Emotion Recognition: Modelling of Ambiguity and Temporal Dynamics","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W6908585519","doi":"https://doi.org/10.26190/unsworks/30630"},"language":"en","primary_location":{"id":"pmh:oai:unsworks.library.unsw.edu.au:1959.4/103386","is_oa":true,"landing_page_url":"http://hdl.handle.net/1959.4/103386","pdf_url":null,"source":{"id":"https://openalex.org/S4306401737","display_name":"UNSWorks (University of New South Wales, Sydney, Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I40053085","host_organization_name":"Australian Defence Force Academy","host_organization_lineage":["https://openalex.org/I40053085"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"http://purl.org/coar/resource_type/c_db06"},"type":"dissertation","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/1959.4/103386","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wu, Jingyao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wu, Jingyao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9553999900817871,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9553999900817871,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.004999999888241291,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.003100000089034438,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.7717999815940857},{"id":"https://openalex.org/keywords/salience","display_name":"Salience (neuroscience)","score":0.645799994468689},{"id":"https://openalex.org/keywords/valence","display_name":"Valence (chemistry)","score":0.4968000054359436},{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.4587000012397766},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.444599986076355},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.4424999952316284},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.41909998655319214},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.3953000009059906},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.3736000061035156}],"concepts":[{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.7717999815940857},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.645799994468689},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.5407000184059143},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5054000020027161},{"id":"https://openalex.org/C168900304","wikidata":"https://www.wikidata.org/wiki/Q171407","display_name":"Valence (chemistry)","level":2,"score":0.4968000054359436},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.4587000012397766},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.444599986076355},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.4424999952316284},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4284000098705292},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.3953000009059906},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.3736000061035156},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.3472000062465668},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.3441999852657318},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.3140999972820282},{"id":"https://openalex.org/C2778023277","wikidata":"https://www.wikidata.org/wiki/Q321703","display_name":"Premise","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3124000132083893},{"id":"https://openalex.org/C2780733359","wikidata":"https://www.wikidata.org/wiki/Q331769","display_name":"Mood","level":2,"score":0.31150001287460327},{"id":"https://openalex.org/C87868495","wikidata":"https://www.wikidata.org/wiki/Q750843","display_name":"Information processing","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C36951298","wikidata":"https://www.wikidata.org/wiki/Q379784","display_name":"Arousal","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C64357122","wikidata":"https://www.wikidata.org/wiki/Q1149766","display_name":"Causality (physics)","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C2778143943","wikidata":"https://www.wikidata.org/wiki/Q523747","display_name":"Expressed emotion","level":2,"score":0.25540000200271606}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:unsworks.library.unsw.edu.au:1959.4/103386","is_oa":true,"landing_page_url":"http://hdl.handle.net/1959.4/103386","pdf_url":null,"source":{"id":"https://openalex.org/S4306401737","display_name":"UNSWorks (University of New South Wales, Sydney, Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I40053085","host_organization_name":"Australian Defence Force Academy","host_organization_lineage":["https://openalex.org/I40053085"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"http://purl.org/coar/resource_type/c_db06"},{"id":"doi:10.26190/unsworks/30630","is_oa":true,"landing_page_url":"https://doi.org/10.26190/unsworks/30630","pdf_url":null,"source":{"id":"https://openalex.org/S7407053176","display_name":"University of New South Wales","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Dissertation"}],"best_oa_location":{"id":"pmh:oai:unsworks.library.unsw.edu.au:1959.4/103386","is_oa":true,"landing_page_url":"http://hdl.handle.net/1959.4/103386","pdf_url":null,"source":{"id":"https://openalex.org/S4306401737","display_name":"UNSWorks (University of New South Wales, Sydney, Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I40053085","host_organization_name":"Australian Defence Force Academy","host_organization_lineage":["https://openalex.org/I40053085"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"http://purl.org/coar/resource_type/c_db06"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Speech":[0],"emotion":[1,18,118,158,233,246,264,277,285,322,330,350,398],"recognition":[2],"(SER)":[3],"plays":[4],"a":[5,106,313,365,389,401,429],"pivotal":[6],"role":[7],"in":[8,21,39,65,93,117,157,321,338,404],"human-computer":[9,383],"interaction":[10],"(HCI).":[11],"The":[12,260,407],"ability":[13],"to":[14,37,50,61,67,87,185,218,335,346,447],"perceive":[15,47,101],"and":[16,28,48,53,100,131,154,162,169,176,183,192,206,244,257,295,301,305,352,371,381,392,436],"understand":[17],"is":[19,138,216,248],"crucial":[20,107],"effective":[22,382],"human":[23,181,339],"communication.":[24],"However,":[25,121],"emotional":[26,95,208,369],"experience":[27],"expression":[29],"are":[30,42,266,344],"inherently":[31],"heterogeneous":[32],"across":[33,298],"different":[34,439],"individuals,":[35],"leading":[36],"ambiguity":[38,153,286,320],"how":[40,242,354],"emotions":[41,52,102,130,294],"perceived.":[43],"While":[44],"humans":[45],"naturally":[46],"response":[49],"both":[51,129,160,299],"their":[54,132],"associated":[55,133],"ambiguities,":[56,85],"machines":[57],"must":[58],"also":[59,283],"learn":[60],"replicate":[62],"this":[63,142,145,326,386],"capacity":[64],"order":[66],"achieve":[68],"natural":[69,94,380],"HCI":[70],"that":[71,201,224,263],"closely":[72,178],"resembles":[73],"human-human":[74],"interactions.":[75,384],"Despite":[76],"this,":[77,237],"most":[78],"existing":[79],"SER":[80,110,308],"systems":[81,309],"often":[82],"overlook":[83],"these":[84],"failing":[86],"capture":[88,336],"the":[89,114,139,148,152,166,231,238,252,318,348,373,396,405,411,418,433],"subtle":[90],"nuances":[91],"present":[92],"expression.":[96],"Humans":[97],"continuously":[98],"express":[99],"during":[103],"interactions,":[104],"introducing":[105],"element":[108],"for":[109,275,395],"system":[111],"design":[112],"-":[113],"continuous":[115,167],"change":[116,356],"over":[119,135,357],"time.":[120],"limited":[122],"research":[123],"has":[124],"been":[125],"conducted":[126],"on":[127,236,312],"modelling":[128,151,276],"ambiguities":[134],"time,":[136],"which":[137],"focus":[140],"of":[141,150,197,255,293,368,375,432,441],"thesis.":[143],"Specifically,":[144],"thesis":[146,190,239,282,387],"addresses":[147],"challenges":[149],"temporal":[155],"dynamics":[156,278],"using":[159,279,287,332],"ordinal":[161,198,213,232],"numerical":[163,288],"representations":[164],"within":[165],"arousal":[168],"valence":[170],"spaces.":[171],"Ordinal":[172],"labels":[173,422],"involve":[174],"comparisons":[175],"preferences,":[177],"align":[179],"with":[180,221,421],"cognition":[182],"tend":[184],"yield":[186],"lower":[187],"ambiguity.":[188],"This":[189,281],"distinguishes":[191],"introduces":[193,388],"two":[194],"distinct":[195],"types":[196,440],"labels,":[199],"discovering":[200],"each":[202],"type":[203],"reflects":[204],"static":[205,243],"dynamic":[207,226,245],"information.":[209],"A":[210],"novel":[211,342],"dynamical":[212],"Markovian":[214],"framework":[215],"proposed":[217,345,408],"integrate":[219],"them,":[220],"results":[222],"showing":[223],"incorporating":[225],"information":[227,247],"can":[228],"significantly":[229],"enhance":[230,372],"modelling.":[234],"Building":[235],"further":[240],"investigates":[241],"captured":[249,268],"by":[250,269],"assessing":[251],"relative":[253],"salience":[254],"audio":[256,270],"video":[258],"cues.":[259],"analysis":[261],"suggests":[262],"changes":[265],"better":[267],"modality,":[271],"providing":[272],"valuable":[273],"sights":[274],"speech.":[280],"models":[284],"representations,":[289],"enabling":[290],"broader":[291],"descriptions":[292],"capturing":[296,428],"continuity":[297],"time":[300,358],"affect":[302],"dimensions":[303],"(arousal":[304],"valence).":[306],"Traditional":[307],"typically":[310],"rely":[311],"single":[314],"mean":[315],"prediction,":[316],"disregarding":[317],"inherent":[319],"perception.":[323,340],"In":[324],"contrast,":[325],"work":[327],"develops":[328],"ambiguity-aware":[329,349,397],"states":[331,351],"probability":[333],"distributions":[334],"variations":[337],"Two":[341],"frameworks":[343],"characterise":[347],"model":[353],"they":[355],"as":[359],"time-varying":[360],"distributions.":[361],"These":[362],"approaches":[363],"facilitate":[364],"deep":[366],"understanding":[367],"fluctuations":[370],"detection":[374],"ambiguous":[376],"emotions,":[377],"fostering":[378],"more":[379,444],"Finally,":[385],"novel,":[390],"interpretable":[391],"quantitative":[393],"measure":[394],"predictions,":[399],"addressing":[400],"notable":[402],"gap":[403],"literature.":[406],"metric,":[409],"called":[410],"Belief":[412],"Mismatch":[413],"Coefficient":[414],"(BMC),":[415],"directly":[416],"compares":[417],"predicted":[419,434],"distribution":[420,435],"collected":[423],"from":[424],"multiple":[425],"annotators,":[426],"efficiently":[427],"comprehensive":[430],"view":[431],"distinguishing":[437],"between":[438],"prediction":[442],"errors":[443],"effectively":[445],"compared":[446],"traditional":[448],"metrics.":[449]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2025-10-10T00:00:00"}
