{"id":"https://openalex.org/W3211189476","doi":"https://doi.org/10.1145/3459637.3481895","title":"AudiBERT","display_name":"AudiBERT","publication_year":2021,"publication_date":"2021-10-26","ids":{"openalex":"https://openalex.org/W3211189476","doi":"https://doi.org/10.1145/3459637.3481895","mag":"3211189476"},"language":"en","primary_location":{"id":"doi:10.1145/3459637.3481895","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481895","pdf_url":null,"source":null,"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004427406","display_name":"Ermal Toto","orcid":"https://orcid.org/0000-0001-6709-8071"},"institutions":[{"id":"https://openalex.org/I107077323","display_name":"Worcester Polytechnic Institute","ror":"https://ror.org/05ejpqr48","country_code":"US","type":"education","lineage":["https://openalex.org/I107077323"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ermal Toto","raw_affiliation_strings":["Worcester Polytechnic Institute, Worcester, MA, USA"],"affiliations":[{"raw_affiliation_string":"Worcester Polytechnic Institute, Worcester, MA, USA","institution_ids":["https://openalex.org/I107077323"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023220887","display_name":"ML Tlachac","orcid":"https://orcid.org/0000-0002-6634-678X"},"institutions":[{"id":"https://openalex.org/I107077323","display_name":"Worcester Polytechnic Institute","ror":"https://ror.org/05ejpqr48","country_code":"US","type":"education","lineage":["https://openalex.org/I107077323"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"ML Tlachac","raw_affiliation_strings":["Worcester Polytechnic Institute, Worcester, MA, USA"],"affiliations":[{"raw_affiliation_string":"Worcester Polytechnic Institute, Worcester, MA, USA","institution_ids":["https://openalex.org/I107077323"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008269094","display_name":"Elke A. Rundensteiner","orcid":"https://orcid.org/0000-0001-5375-9254"},"institutions":[{"id":"https://openalex.org/I107077323","display_name":"Worcester Polytechnic Institute","ror":"https://ror.org/05ejpqr48","country_code":"US","type":"education","lineage":["https://openalex.org/I107077323"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Elke A. Rundensteiner","raw_affiliation_strings":["Worcester Polytechnic Institute, Worcester, MA, USA"],"affiliations":[{"raw_affiliation_string":"Worcester Polytechnic Institute, Worcester, MA, USA","institution_ids":["https://openalex.org/I107077323"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004427406"],"corresponding_institution_ids":["https://openalex.org/I107077323"],"apc_list":null,"apc_paid":null,"fwci":7.1816,"has_fulltext":false,"cited_by_count":54,"citation_normalized_percentile":{"value":0.97432759,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4145","last_page":"4154"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10863","display_name":"Voice and Speech Disorders","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7100580930709839},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6791454553604126},{"id":"https://openalex.org/keywords/depression","display_name":"Depression (economics)","score":0.5235633254051208},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4980430603027344},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.463580846786499},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.41150644421577454},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4108998775482178},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3306503891944885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7100580930709839},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6791454553604126},{"id":"https://openalex.org/C2776867660","wikidata":"https://www.wikidata.org/wiki/Q1814941","display_name":"Depression (economics)","level":2,"score":0.5235633254051208},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4980430603027344},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.463580846786499},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.41150644421577454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4108998775482178},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3306503891944885},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3459637.3481895","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481895","pdf_url":null,"source":null,"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W96961569","https://openalex.org/W1494198834","https://openalex.org/W1970578576","https://openalex.org/W1974665640","https://openalex.org/W2003502731","https://openalex.org/W2010817634","https://openalex.org/W2021247507","https://openalex.org/W2051647439","https://openalex.org/W2076444692","https://openalex.org/W2080576537","https://openalex.org/W2099832283","https://openalex.org/W2109636054","https://openalex.org/W2132322340","https://openalex.org/W2144723972","https://openalex.org/W2156104108","https://openalex.org/W2231475797","https://openalex.org/W2250539671","https://openalex.org/W2252180568","https://openalex.org/W2254462287","https://openalex.org/W2291466689","https://openalex.org/W2400334276","https://openalex.org/W2526050071","https://openalex.org/W2529925562","https://openalex.org/W2530421149","https://openalex.org/W2551548999","https://openalex.org/W2626778328","https://openalex.org/W2793141922","https://openalex.org/W2889056793","https://openalex.org/W2889089254","https://openalex.org/W2892181857","https://openalex.org/W2896457183","https://openalex.org/W2910883992","https://openalex.org/W2964308564","https://openalex.org/W2980282514","https://openalex.org/W2981660166","https://openalex.org/W2990138404","https://openalex.org/W3016839817","https://openalex.org/W3099782249","https://openalex.org/W3129219638","https://openalex.org/W4295682739"],"related_works":["https://openalex.org/W2185469136","https://openalex.org/W4306353150","https://openalex.org/W2026860389","https://openalex.org/W2168054807","https://openalex.org/W2382997850","https://openalex.org/W2058990474","https://openalex.org/W2043363698","https://openalex.org/W3207883763","https://openalex.org/W4386977688","https://openalex.org/W4380075502"],"abstract_inverted_index":{"Depression":[0,27],"is":[1],"a":[2,60,83,116,121],"leading":[3],"cause":[4],"of":[5,13,63,93,170,180],"disability":[6],"with":[7,56,134],"tremendous":[8],"socioeconomic":[9],"costs.":[10],"In":[11],"spite":[12],"early":[14],"detection":[15],"being":[16],"crucial":[17],"to":[18,34,51,69,127,145,172],"improving":[19],"prognosis,":[20],"this":[21,40,76],"mental":[22],"illness":[23],"remains":[24],"largely":[25],"undiagnosed.":[26],"classification":[28,67,129],"from":[29,71,158,183],"voice":[30],"holds":[31],"the":[32,90,98,111,178],"promise":[33],"revolutionize":[35],"diagnosis":[36],"by":[37,115],"ubiquitously":[38],"integrating":[39],"screening":[41,182],"capability":[42],"into":[43,120],"virtual":[44],"assistants":[45],"and":[46,106,142,148,161,174],"smartphone":[47],"technologies.":[48,188],"Unfortunately,":[49],"due":[50],"privacy":[52],"concerns,":[53],"audio":[54,105,147],"datasets":[55],"depression":[57,128,181],"labels":[58],"have":[59],"small":[61,99],"number":[62],"participants,":[64],"causing":[65],"current":[66],"models":[68,109,150],"suffer":[70],"low":[72],"performance.":[73],"To":[74,96],"tackle":[75],"challenge,":[77],"we":[78],"introduce":[79],"Audio-Assisted":[80],"BERT":[81],"(AudiBERT),":[82],"novel":[84],"deep":[85,122],"learning":[86,123],"framework":[87,166],"that":[88],"leverages":[89],"multimodal":[91],"nature":[92],"human":[94],"voice.":[95],"alleviate":[97],"data":[100],"problem,":[101],"AudiBERT":[102,125],"integrates":[103],"pretrained":[104],"text":[107,149],"representation":[108],"for":[110,151],"respective":[112],"modalities":[113],"augmented":[114],"dual":[117],"self-attention":[118],"mechanism":[119],"architecture.":[124],"applied":[126],"consistently":[130],"achieves":[131,167],"promising":[132],"performance":[133],"an":[135],"increase":[136],"in":[137],"F1":[138,168],"scores":[139,169],"between":[140],"6%":[141],"30%":[143],"compared":[144],"state-of-the-art":[146],"15":[152],"thematic":[153],"question":[154],"datasets.":[155],"Using":[156],"answers":[157],"medically":[159],"targeted":[160],"general":[162],"wellness":[163],"questions,":[164],"our":[165],"up":[171],"0.92":[173],"0.86,":[175],"respectively,":[176],"demonstrating":[177],"feasibility":[179],"informal":[184],"dialogue":[185],"using":[186],"voice-enabled":[187]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":19},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2021-11-08T00:00:00"}
