{"id":"https://openalex.org/W4283704748","doi":"https://doi.org/10.21437/interspeech.2022-712","title":"Conformer Based Elderly Speech Recognition System for Alzheimer\u2019s Disease Detection","display_name":"Conformer Based Elderly Speech Recognition System for Alzheimer\u2019s Disease Detection","publication_year":2022,"publication_date":"2022-09-16","ids":{"openalex":"https://openalex.org/W4283704748","doi":"https://doi.org/10.21437/interspeech.2022-712"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2022-712","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-712","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106407750","display_name":"Tianzi Wang","orcid":"https://orcid.org/0009-0005-5823-3039"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tianzi Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106406454","display_name":"Jiajun Deng","orcid":"https://orcid.org/0000-0001-8874-4167"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiajun Deng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003895235","display_name":"Mengzhe Geng","orcid":"https://orcid.org/0000-0002-7886-439X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mengzhe Geng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100341722","display_name":"Zi Ye","orcid":"https://orcid.org/0000-0003-1002-0315"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zi Ye","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045355404","display_name":"Shoukang Hu","orcid":"https://orcid.org/0000-0002-3345-6923"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shoukang Hu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100364982","display_name":"Yi Wang","orcid":"https://orcid.org/0000-0002-8448-8570"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100938995","display_name":"Mingyu Cui","orcid":"https://orcid.org/0000-0002-2672-2461"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mingyu Cui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075023049","display_name":"Zengrui Jin","orcid":"https://orcid.org/0000-0002-2637-7880"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zengrui Jin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037109470","display_name":"Xunying Liu","orcid":"https://orcid.org/0000-0001-6725-1160"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xunying Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5019458385","display_name":"Helen Meng","orcid":"https://orcid.org/0000-0002-4427-3532"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Helen Meng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5106407750"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7893,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.86902364,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"4825","last_page":"4829"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7622231245040894},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6906383633613586},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.6021637320518494},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4956287145614624},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46793004870414734},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4656648635864258},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.465164452791214},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.4477599859237671},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.44394952058792114},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4306301474571228},{"id":"https://openalex.org/keywords/residual-neural-network","display_name":"Residual neural network","score":0.41663578152656555}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7622231245040894},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6906383633613586},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.6021637320518494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4956287145614624},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46793004870414734},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4656648635864258},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.465164452791214},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.4477599859237671},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.44394952058792114},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4306301474571228},{"id":"https://openalex.org/C2944601119","wikidata":"https://www.wikidata.org/wiki/Q43744058","display_name":"Residual neural network","level":3,"score":0.41663578152656555},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2022-712","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-712","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4000000059604645,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4394775207","https://openalex.org/W4382052965","https://openalex.org/W2145230572","https://openalex.org/W2166312020","https://openalex.org/W4387090791","https://openalex.org/W4401751953","https://openalex.org/W2914064142","https://openalex.org/W156567445","https://openalex.org/W3136989387","https://openalex.org/W4287266619"],"abstract_inverted_index":{"Early":[0],"diagnosis":[1],"of":[2,21,59,70,106,117,139],"Alzheimer's":[3],"disease":[4],"(AD)":[5],"is":[6,52],"crucial":[7],"in":[8,74],"facilitating":[9],"preventive":[10],"care":[11],"to":[12,76,127],"delay":[13],"further":[14],"progression.":[15],"This":[16],"paper":[17],"presents":[18],"the":[19,31,114,122,131],"development":[20],"a":[22,57],"state-of-the-art":[23],"Conformer":[24,41,72],"based":[25,49,68,93,135],"speech":[26,133],"recognition":[27,125,134],"system":[28,42],"built":[29],"on":[30,113],"DementiaBank":[32],"Pitt":[33],"corpus":[34],"for":[35],"automatic":[36],"AD":[37,136],"detection.":[38],"The":[39],"baseline":[40],"trained":[43],"with":[44,95],"speed":[45],"perturbation":[46],"and":[47,89],"SpecAugment":[48],"data":[50,116],"augmentation":[51],"significantly":[53],"improved":[54],"by":[55],"incorporating":[56],"set":[58],"purposefully":[60],"designed":[61],"modeling":[62],"features,":[63,130],"including":[64],"neural":[65],"architecture":[66],"search":[67],"auto-configuration":[69],"domain-specific":[71],"hyper-parameters":[73],"addition":[75],"parameter":[77],"fine-tuning;":[78],"fine-grained":[79],"elderly":[80,119],"speaker":[81],"adaptation":[82],"using":[83],"learning":[84],"hidden":[85],"unit":[86],"contributions":[87],"(LHUC);":[88],"two-pass":[90],"cross-system":[91],"rescoring":[92],"combination":[94],"hybrid":[96],"TDNN":[97],"systems.":[98],"An":[99],"overall":[100],"word":[101],"error":[102],"rate":[103],"(WER)":[104],"reduction":[105],"13.6%":[107],"absolute":[108],"(34.8%":[109],"relative)":[110],"was":[111,141],"obtained":[112],"evaluation":[115],"48":[118],"speakers.":[120],"Using":[121],"final":[123],"systems'":[124],"outputs":[126],"extract":[128],"textual":[129],"best-published":[132],"detection":[137],"accuracy":[138],"91.7%":[140],"obtained.":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":4}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
