{"id":"https://openalex.org/W3196761683","doi":"https://doi.org/10.21437/interspeech.2021-1288","title":"Late Fusion of the Available Lexicon and Raw Waveform-Based Acoustic Modeling for Depression and Dementia Recognition","display_name":"Late Fusion of the Available Lexicon and Raw Waveform-Based Acoustic Modeling for Depression and Dementia Recognition","publication_year":2021,"publication_date":"2021-08-27","ids":{"openalex":"https://openalex.org/W3196761683","doi":"https://doi.org/10.21437/interspeech.2021-1288","mag":"3196761683"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2021-1288","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1288","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://infoscience.epfl.ch/record/296847","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075765823","display_name":"Esa\u00fa Villatoro-Tello","orcid":"https://orcid.org/0000-0002-1322-0358"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Esa\u00fa Villatoro-Tello","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008235303","display_name":"S. Pavankumar Dubagunta","orcid":"https://orcid.org/0000-0002-4307-8604"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"S. Pavankumar Dubagunta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090361451","display_name":"Julian Fritsch","orcid":"https://orcid.org/0000-0003-4290-3913"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Julian Fritsch","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058435824","display_name":"Gabriela Ram\u00edrez-de-la-Rosa","orcid":"https://orcid.org/0000-0003-4730-5613"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gabriela Ram\u00edrez-de-la-Rosa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076409146","display_name":"Petr Motl\u00ed\u010dek","orcid":"https://orcid.org/0000-0001-6467-1119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Petr Motlicek","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5043551083","display_name":"Mathew Magimai.-Doss","orcid":"https://orcid.org/0000-0002-8714-1409"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mathew Magimai-Doss","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.2777,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.92060157,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1927","last_page":"1931"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11519","display_name":"Digital Mental Health Interventions","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/3202","display_name":"Applied Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dementia","display_name":"Dementia","score":0.694365382194519},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.6815452575683594},{"id":"https://openalex.org/keywords/waveform","display_name":"Waveform","score":0.6568931937217712},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6417909860610962},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4691449701786041},{"id":"https://openalex.org/keywords/depression","display_name":"Depression (economics)","score":0.4528743028640747},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4404492974281311},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40426743030548096},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.19044244289398193},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.16288819909095764}],"concepts":[{"id":"https://openalex.org/C2779483572","wikidata":"https://www.wikidata.org/wiki/Q83030","display_name":"Dementia","level":3,"score":0.694365382194519},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.6815452575683594},{"id":"https://openalex.org/C197424946","wikidata":"https://www.wikidata.org/wiki/Q1165717","display_name":"Waveform","level":3,"score":0.6568931937217712},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6417909860610962},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4691449701786041},{"id":"https://openalex.org/C2776867660","wikidata":"https://www.wikidata.org/wiki/Q1814941","display_name":"Depression (economics)","level":2,"score":0.4528743028640747},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4404492974281311},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40426743030548096},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.19044244289398193},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.16288819909095764},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2021-1288","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1288","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},{"id":"pmh:oai:infoscience.epfl.ch:296847","is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/296847","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"WoS","raw_type":"conference proceedings"}],"best_oa_location":{"id":"pmh:oai:infoscience.epfl.ch:296847","is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/296847","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"WoS","raw_type":"conference proceedings"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2003502731","https://openalex.org/W2058971120","https://openalex.org/W2078396654","https://openalex.org/W2140910804","https://openalex.org/W2252180568","https://openalex.org/W2623779865","https://openalex.org/W2889056793","https://openalex.org/W2895995041","https://openalex.org/W2936879941","https://openalex.org/W2954915517","https://openalex.org/W2963341956","https://openalex.org/W2981677410","https://openalex.org/W3035250245","https://openalex.org/W3097109903","https://openalex.org/W3106912061","https://openalex.org/W3129165846"],"related_works":["https://openalex.org/W2140536630","https://openalex.org/W2391730868","https://openalex.org/W2759814045","https://openalex.org/W2736760277","https://openalex.org/W4386940087","https://openalex.org/W4386931226","https://openalex.org/W2118055728","https://openalex.org/W2184188632","https://openalex.org/W3159089150","https://openalex.org/W1974895211"],"abstract_inverted_index":{"Mental":[0],"disorders,":[1],"e.g.":[2],"depression":[3],"and":[4,24,96,155,159],"dementia,":[5],"are":[6],"categorized":[7],"as":[8,99],"priority":[9],"conditions":[10],"according":[11],"to":[12,42],"the":[13,44,59,80,88,93,128,139,144],"World":[14],"Health":[15],"Organization":[16],"(WHO).":[17],"When":[18],"diagnosing,":[19],"psychologists":[20],"employ":[21],"structured":[22],"questionnaires/interviews,":[23],"different":[25],"cognitive":[26,73],"tests.":[27],"Although":[28],"accurate,":[29],"there":[30],"is":[31,108],"an":[32,150],"increasing":[33],"necessity":[34],"of":[35,67,92,119,146,153],"developing":[36],"digital":[37],"mental":[38],"health":[39],"support":[40],"technologies":[41],"alleviate":[43],"burden":[45],"faced":[46],"by":[47,63,79,110],"professionals.":[48],"In":[49,127],"this":[50],"paper,":[51],"we":[52],"propose":[53],"a":[54,68,72,102,111,130],"multi-modal":[55],"approach":[56],"for":[57,157],"modeling":[58],"communication":[60],"process":[61],"employed":[62],"patients":[64],"being":[65],"part":[66],"clinical":[69],"interview":[70],"or":[71],"test.":[74],"The":[75,105],"language-based":[76],"modality,":[77],"inspired":[78],"Lexical":[81],"Availability":[82],"(LA)":[83],"theory":[84],"from":[85],"psycho-linguistics,":[86],"identifies":[87],"most":[89],"accessible":[90],"vocabulary":[91],"interviewed":[94],"subject":[95],"use":[97],"it":[98],"features":[100],"in":[101],"classification":[103],"process.":[104],"acoustic-based":[106],"modality":[107],"processed":[109],"Convolutional":[112],"Neural":[113],"Network":[114],"(CNN)":[115],"trained":[116],"on":[117,135],"signals":[118],"speech":[120],"that":[121],"predominantly":[122],"contained":[123],"voice":[124],"source":[125],"characteristics.":[126],"end,":[129],"late":[131],"fusion":[132],"technique,":[133],"based":[134],"majority":[136],"voting,":[137],"assigns":[138],"final":[140],"classification.":[141],"Results":[142],"show":[143],"complementarity":[145],"both":[147],"modalities,":[148],"reaching":[149],"overall":[151],"Macro-F1":[152],"84%":[154],"90%":[156],"Depression":[158],"Alzheimer's":[160],"dementia":[161],"respectively.":[162]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":12},{"year":2021,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
