{"id":"https://openalex.org/W4408353607","doi":"https://doi.org/10.1109/icassp49660.2025.10890111","title":"Using Corrected ASR Projection to Improve AD Recognition Performance from Spontaneous Speech","display_name":"Using Corrected ASR Projection to Improve AD Recognition Performance from Spontaneous Speech","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408353607","doi":"https://doi.org/10.1109/icassp49660.2025.10890111"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890111","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100749834","display_name":"Yunfan Zhang","orcid":"https://orcid.org/0000-0001-5927-7109"},"institutions":[{"id":"https://openalex.org/I118574674","display_name":"Jiangsu Normal University","ror":"https://ror.org/051hvcm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I118574674"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunfan Zhang","raw_affiliation_strings":["JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China"],"affiliations":[{"raw_affiliation_string":"JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China","institution_ids":["https://openalex.org/I118574674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112651363","display_name":"Yun Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I118574674","display_name":"Jiangsu Normal University","ror":"https://ror.org/051hvcm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I118574674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Jin","raw_affiliation_strings":["JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China"],"affiliations":[{"raw_affiliation_string":"JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China","institution_ids":["https://openalex.org/I118574674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102970671","display_name":"Guanlin Chen","orcid":"https://orcid.org/0009-0004-4735-0582"},"institutions":[{"id":"https://openalex.org/I118574674","display_name":"Jiangsu Normal University","ror":"https://ror.org/051hvcm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I118574674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanlin Chen","raw_affiliation_strings":["JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China"],"affiliations":[{"raw_affiliation_string":"JiangSu Normal University,School of Physics and Electronic Engineering,Xuzhou,China","institution_ids":["https://openalex.org/I118574674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112033291","display_name":"Yong Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I118574674","display_name":"Jiangsu Normal University","ror":"https://ror.org/051hvcm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I118574674"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Ma","raw_affiliation_strings":["JiangSu Normal University,School of Linguistic Sciences and Arts,Xuzhou,China"],"affiliations":[{"raw_affiliation_string":"JiangSu Normal University,School of Linguistic Sciences and Arts,Xuzhou,China","institution_ids":["https://openalex.org/I118574674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000601742","display_name":"Maoshen Jia","orcid":"https://orcid.org/0000-0002-3452-3913"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Maoshen Jia","raw_affiliation_strings":["Beijing University of Technology,Faculty of Information Technology,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Technology,Faculty of Information Technology,Beijing,China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043275789","display_name":"Peng Song","orcid":"https://orcid.org/0000-0003-2734-2783"},"institutions":[{"id":"https://openalex.org/I18452120","display_name":"Yantai University","ror":"https://ror.org/01rp41m56","country_code":"CN","type":"education","lineage":["https://openalex.org/I18452120"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Song","raw_affiliation_strings":["Yantai University,School of Computer and Control Engineering,Yantai,China"],"affiliations":[{"raw_affiliation_string":"Yantai University,School of Computer and Control Engineering,Yantai,China","institution_ids":["https://openalex.org/I18452120"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100749834"],"corresponding_institution_ids":["https://openalex.org/I118574674"],"apc_list":null,"apc_paid":null,"fwci":6.9508,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96039377,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9164999723434448,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7541277408599854},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7211448550224304},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.5058924555778503},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36569732427597046},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.062919020652771}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7541277408599854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7211448550224304},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.5058924555778503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36569732427597046},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.062919020652771}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890111","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1566256432","https://openalex.org/W1853705225","https://openalex.org/W2407894931","https://openalex.org/W2597672453","https://openalex.org/W2801987007","https://openalex.org/W2909351650","https://openalex.org/W2991435809","https://openalex.org/W3096912371","https://openalex.org/W3097779478","https://openalex.org/W3161873458","https://openalex.org/W3163826605","https://openalex.org/W3209641573","https://openalex.org/W4283717314","https://openalex.org/W4285294723","https://openalex.org/W4286769904","https://openalex.org/W4402111730","https://openalex.org/W4402112421"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Alzheimer's":[0],"Disease":[1],"patients":[2],"often":[3],"exhibit":[4],"cognitive":[5],"decline,":[6],"with":[7,110,134],"language":[8,25,47],"impairment":[9],"being":[10],"a":[11,18],"prominent":[12],"biomarker.":[13],"Spontaneous":[14],"speech":[15],"analysis":[16],"provides":[17],"non-invasive":[19],"screening":[20],"approach":[21],"for":[22,29,131],"AD.":[23],"Large":[24],"models,":[26],"increasingly":[27],"employed":[28],"textual":[30,87],"feature":[31,62,108,115],"extraction,":[32],"show":[33],"potential":[34],"in":[35,49],"early":[36],"AD":[37,50,132],"prediction.":[38],"However,":[39],"Automatic":[40],"Speech":[41],"Recognition":[42],"transcription":[43,107,114],"errors,":[44],"stemming":[45],"from":[46],"impairments":[48],"and":[51,85,96],"Mild":[52],"Cognitive":[53],"Impairment":[54],"patients,":[55],"can":[56],"lead":[57],"to":[58],"information":[59],"loss":[60],"during":[61],"extraction.":[63],"To":[64],"mitigate":[65],"this,":[66],"we":[67],"introduce":[68],"the":[69,105,111,119,125,135],"Corrected":[70],"ASR":[71,106,113],"Projecting,":[72],"CAP":[73,99,126],"model.":[74],"During":[75],"training,":[76],"ASR-transcribed":[77],"text":[78],"is":[79,101],"manually":[80],"corrected":[81,112],"one":[82],"by":[83,103],"one,":[84],"then":[86],"features":[88],"are":[89],"extracted":[90],"independently":[91],"using":[92],"BERT,":[93],"Claude,":[94],"GLM,":[95],"GPT-3.":[97],"The":[98],"model":[100,127],"trained":[102],"aligning":[104],"space":[109],"space.":[116],"Experiments":[117],"on":[118],"NCMMSC":[120],"2021":[121],"dataset":[122],"demonstrate":[123],"that":[124],"improves":[128],"classification":[129],"performance":[130],"recognition,":[133],"maximum":[136],"accuracy":[137],"improvement":[138],"reaching":[139],"5.55%.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
