{"id":"https://openalex.org/W4388821109","doi":"https://doi.org/10.1109/apsipaasc58517.2023.10317555","title":"Data Selection Based on Phoneme Affinity Matrix for Electrolarynx Speech Recognition","display_name":"Data Selection Based on Phoneme Affinity Matrix for Electrolarynx Speech Recognition","publication_year":2023,"publication_date":"2023-10-31","ids":{"openalex":"https://openalex.org/W4388821109","doi":"https://doi.org/10.1109/apsipaasc58517.2023.10317555"},"language":"en","primary_location":{"id":"doi:10.1109/apsipaasc58517.2023.10317555","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/apsipaasc58517.2023.10317555","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049205300","display_name":"I-Ting Hsieh","orcid":"https://orcid.org/0009-0001-4446-7476"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"I-Ting Hsieh","raw_affiliation_strings":["National Cheng Kung University,Graduate Program of Multimedia Systems and Intelligent Computing,Tainan,Taiwan","Graduate Program of Multimedia Systems and Intelligent Computing, National Cheng Kung University, Tainan, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Cheng Kung University,Graduate Program of Multimedia Systems and Intelligent Computing,Tainan,Taiwan","institution_ids":["https://openalex.org/I91807558"]},{"raw_affiliation_string":"Graduate Program of Multimedia Systems and Intelligent Computing, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103251327","display_name":"Chung\u2010Hsien Wu","orcid":"https://orcid.org/0000-0002-3947-2123"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Hsien Wu","raw_affiliation_strings":["National Cheng Kung University,Graduate Program of Multimedia Systems and Intelligent Computing,Tainan,Taiwan","Graduate Program of Multimedia Systems and Intelligent Computing, National Cheng Kung University, Tainan, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Cheng Kung University,Graduate Program of Multimedia Systems and Intelligent Computing,Tainan,Taiwan","institution_ids":["https://openalex.org/I91807558"]},{"raw_affiliation_string":"Graduate Program of Multimedia Systems and Intelligent Computing, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5093294160","display_name":"Shu-Wei Tsa","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158999","display_name":"National Cheng Kung University Hospital","ror":"https://ror.org/04zx3rq17","country_code":"TW","type":"healthcare","lineage":["https://openalex.org/I4210158999"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shu-Wei Tsa","raw_affiliation_strings":["National Cheng Kung University Hospital,Dept. of Otolaryngology,Taiwan","Dept. of Otolaryngology, National Cheng Kung University Hospital, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Cheng Kung University Hospital,Dept. of Otolaryngology,Taiwan","institution_ids":["https://openalex.org/I4210158999"]},{"raw_affiliation_string":"Dept. of Otolaryngology, National Cheng Kung University Hospital, Taiwan","institution_ids":["https://openalex.org/I4210158999"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049205300"],"corresponding_institution_ids":["https://openalex.org/I91807558"],"apc_list":null,"apc_paid":null,"fwci":0.1746,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.57697918,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"2196","last_page":"2202"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10863","display_name":"Voice and Speech Disorders","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.775065541267395},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7418814897537231},{"id":"https://openalex.org/keywords/intelligibility","display_name":"Intelligibility (philosophy)","score":0.7198936939239502},{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.589388906955719},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5697563290596008},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.4911758601665497},{"id":"https://openalex.org/keywords/acoustic-model","display_name":"Acoustic model","score":0.47983691096305847},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4658993184566498},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.4467660188674927},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.4070921540260315},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3544656038284302},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07421824336051941}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.775065541267395},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7418814897537231},{"id":"https://openalex.org/C60048801","wikidata":"https://www.wikidata.org/wiki/Q1433889","display_name":"Intelligibility (philosophy)","level":2,"score":0.7198936939239502},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.589388906955719},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5697563290596008},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.4911758601665497},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.47983691096305847},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4658993184566498},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.4467660188674927},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.4070921540260315},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3544656038284302},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07421824336051941},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc58517.2023.10317555","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/apsipaasc58517.2023.10317555","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5600000023841858}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W137929712","https://openalex.org/W1524333225","https://openalex.org/W1596477320","https://openalex.org/W1631260214","https://openalex.org/W2060106308","https://openalex.org/W2091746061","https://openalex.org/W2116593694","https://openalex.org/W2147244000","https://openalex.org/W2187234408","https://openalex.org/W2407080277","https://openalex.org/W2604763608","https://openalex.org/W2888867175","https://openalex.org/W2894877413","https://openalex.org/W2902967674","https://openalex.org/W2913862288","https://openalex.org/W2936774411","https://openalex.org/W2936861580","https://openalex.org/W2972667718","https://openalex.org/W2983434507","https://openalex.org/W2992384298","https://openalex.org/W3010079431","https://openalex.org/W3013967924","https://openalex.org/W3014690389","https://openalex.org/W3015585292","https://openalex.org/W3035268246","https://openalex.org/W3089548201","https://openalex.org/W3096263335","https://openalex.org/W4210590938","https://openalex.org/W4388821498","https://openalex.org/W6605526561","https://openalex.org/W6631362777","https://openalex.org/W6736057607","https://openalex.org/W6791250781"],"related_works":["https://openalex.org/W2081919107","https://openalex.org/W3115948027","https://openalex.org/W2405110677","https://openalex.org/W4387323809","https://openalex.org/W2811496854","https://openalex.org/W4200068392","https://openalex.org/W2772686614","https://openalex.org/W2164829670","https://openalex.org/W2036933852","https://openalex.org/W2152945827"],"abstract_inverted_index":{"Electrolarynx":[0],"(EL)":[1],"is":[2,40,49,92,171],"a":[3,69,142],"communicative":[4],"aid":[5],"for":[6,34,98,163],"the":[7,27,30,38,44,53,77,84,95,100,114,125,128,147,153,174,177,181,185,193,200,210,213,220],"patient":[8,39],"after":[9],"laryngectomy":[10],"to":[11,51,151,208,218],"generate":[12],"communicable":[13],"speech.":[14,89,138],"Since":[15],"EL":[16,45,65,88,117,129,161],"speech":[17,20,31,61,66,104,118,130,157,162,223],"exhibits":[18],"low":[19],"intelligibility":[21],"and":[22,212],"produces":[23],"loud":[24],"noise,":[25],"understanding":[26],"content":[28],"of":[29,64,79,87,94,102,127,136,155,176,180],"remains":[32],"challenging":[33],"listeners,":[35],"even":[36,107],"if":[37],"proficient":[41],"in":[42,73,116],"using":[43,146],"device.":[46],"Accordingly,":[47],"it":[48],"important":[50],"develop":[52],"tools":[54],"that":[55,158,192],"offer":[56],"additional":[57],"communication":[58],"methods.":[59],"Automatic":[60],"recognition":[62,85,119],"(ASR)":[63],"emerges":[67],"as":[68,173],"method":[70,145,214],"worth":[71],"considering":[72,184],"this":[74],"regard.":[75],"However,":[76,106],"problem":[78],"under-resourced":[80,103],"data":[81,143,164,196],"dramatically":[82],"degrades":[83],"performance":[86],"Data":[90],"augmentation":[91],"one":[93],"viable":[96],"solutions":[97],"addressing":[99],"issue":[101],"data.":[105],"with":[108],"an":[109],"increased":[110],"health":[111,137,156,222],"training":[112],"corpus,":[113],"improvement":[115],"may":[120],"not":[121],"be":[122],"satisfactory.":[123],"Because":[124],"characteristics":[126],"still":[131],"differ":[132],"significantly":[133],"from":[134],"those":[135],"This":[139],"paper":[140],"proposes":[141],"selection":[144,154,197],"phoneme":[148,186,201],"affinity":[149,167,202],"matrix":[150,203],"prioritize":[152],"closely":[159],"resembles":[160],"augmentation.":[165],"The":[166,188],"between":[168],"two":[169,182],"phonemes":[170],"defined":[172],"similarity":[175],"Phone":[178],"Posteriorgrams(PPGs)":[179],"phonemes,":[183],"models.":[187],"experimental":[189],"results":[190,206],"demonstrate":[191],"approach":[194],"utilizing":[195],"based":[198],"on":[199],"yields":[204],"superior":[205],"compared":[207],"both":[209],"baseline":[211],"employing":[215],"random":[216],"sampling":[217],"select":[219],"augmented":[221],"corpus.":[224]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
