{"id":"https://openalex.org/W4283718561","doi":"https://doi.org/10.1109/codit55151.2022.9803962","title":"On the use of Deep Learning and Scattering Transform for Pathological voices recognition","display_name":"On the use of Deep Learning and Scattering Transform for Pathological voices recognition","publication_year":2022,"publication_date":"2022-05-17","ids":{"openalex":"https://openalex.org/W4283718561","doi":"https://doi.org/10.1109/codit55151.2022.9803962"},"language":"en","primary_location":{"id":"doi:10.1109/codit55151.2022.9803962","is_oa":false,"landing_page_url":"https://doi.org/10.1109/codit55151.2022.9803962","pdf_url":null,"source":{"id":"https://openalex.org/S4363607900","display_name":"2022 8th International Conference on Control, Decision and Information Technologies (CoDIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 8th International Conference on Control, Decision and Information Technologies (CoDIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056860576","display_name":"Sameh Souli","orcid":null},"institutions":[{"id":"https://openalex.org/I63596082","display_name":"Tunis El Manar University","ror":"https://ror.org/029cgt552","country_code":"TN","type":"education","lineage":["https://openalex.org/I63596082"]},{"id":"https://openalex.org/I2800887215","display_name":"Tunisia Polytechnic School","ror":"https://ror.org/00dse3307","country_code":"TN","type":"education","lineage":["https://openalex.org/I2800887215"]}],"countries":["TN"],"is_corresponding":true,"raw_author_name":"S. Souli","raw_affiliation_strings":["University Tunis El-Manar,Faculty of Sciences of Tunis,Tunis,Tunisia,2092","Polytech Innovation LAB (PI-LAB), Private International Polytechnic School of Tunis, Tunisia"],"affiliations":[{"raw_affiliation_string":"University Tunis El-Manar,Faculty of Sciences of Tunis,Tunis,Tunisia,2092","institution_ids":["https://openalex.org/I63596082"]},{"raw_affiliation_string":"Polytech Innovation LAB (PI-LAB), Private International Polytechnic School of Tunis, Tunisia","institution_ids":["https://openalex.org/I2800887215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043848334","display_name":"Rim Amami","orcid":"https://orcid.org/0000-0002-3507-8428"},"institutions":[{"id":"https://openalex.org/I76571253","display_name":"Imam Abdulrahman Bin Faisal University","ror":"https://ror.org/038cy8j79","country_code":"SA","type":"education","lineage":["https://openalex.org/I76571253"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"R. Amami","raw_affiliation_strings":["Imam AbdulRahman bin Faisal University,Computer Science Department,Dammam,Saudi Arabia","Computer Science Department, Imam AbdulRahman bin Faisal University, Dammam, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"Imam AbdulRahman bin Faisal University,Computer Science Department,Dammam,Saudi Arabia","institution_ids":["https://openalex.org/I76571253"]},{"raw_affiliation_string":"Computer Science Department, Imam AbdulRahman bin Faisal University, Dammam, Saudi Arabia","institution_ids":["https://openalex.org/I76571253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110920074","display_name":"A. Soltani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210131288","display_name":"National Engineering School of Tunis","ror":"https://ror.org/03b1zjt31","country_code":"TN","type":"education","lineage":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"A. Soltani","raw_affiliation_strings":["University of Tunis L.R: LATICE Tunis,National Superior School of Engineering,Tunis,1008"],"affiliations":[{"raw_affiliation_string":"University of Tunis L.R: LATICE Tunis,National Superior School of Engineering,Tunis,1008","institution_ids":["https://openalex.org/I4210131288"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070511935","display_name":"Sadok Ben Yahia","orcid":"https://orcid.org/0000-0001-8939-8948"},"institutions":[{"id":"https://openalex.org/I63596082","display_name":"Tunis El Manar University","ror":"https://ror.org/029cgt552","country_code":"TN","type":"education","lineage":["https://openalex.org/I63596082"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"S. Ben Yahia","raw_affiliation_strings":["University Tunis El-Manar,Faculty of Sciences of Tunis,Tunis,Tunisia,2092"],"affiliations":[{"raw_affiliation_string":"University Tunis El-Manar,Faculty of Sciences of Tunis,Tunis,Tunisia,2092","institution_ids":["https://openalex.org/I63596082"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5056860576"],"corresponding_institution_ids":["https://openalex.org/I2800887215","https://openalex.org/I63596082"],"apc_list":null,"apc_paid":null,"fwci":0.1227,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.22180095,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1055","last_page":"1058"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8838281631469727},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.819572925567627},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7698023319244385},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7349637746810913},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7198585271835327},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.690624475479126},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5972399711608887},{"id":"https://openalex.org/keywords/wavelet-transform","display_name":"Wavelet transform","score":0.5767021179199219},{"id":"https://openalex.org/keywords/wavelet","display_name":"Wavelet","score":0.5424145460128784},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.521632969379425}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8838281631469727},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.819572925567627},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7698023319244385},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7349637746810913},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7198585271835327},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.690624475479126},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5972399711608887},{"id":"https://openalex.org/C196216189","wikidata":"https://www.wikidata.org/wiki/Q2867","display_name":"Wavelet transform","level":3,"score":0.5767021179199219},{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.5424145460128784},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.521632969379425},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/codit55151.2022.9803962","is_oa":false,"landing_page_url":"https://doi.org/10.1109/codit55151.2022.9803962","pdf_url":null,"source":{"id":"https://openalex.org/S4363607900","display_name":"2022 8th International Conference on Control, Decision and Information Technologies (CoDIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 8th International Conference on Control, Decision and Information Technologies (CoDIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7099999785423279,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1994906459","https://openalex.org/W2055332436","https://openalex.org/W2072072671","https://openalex.org/W2076063813","https://openalex.org/W2093231248","https://openalex.org/W2100495367","https://openalex.org/W2108598243","https://openalex.org/W2120480077","https://openalex.org/W2122410667","https://openalex.org/W2124537004","https://openalex.org/W2133257461","https://openalex.org/W2139252078","https://openalex.org/W2147768505","https://openalex.org/W2163605009","https://openalex.org/W2165806037","https://openalex.org/W2385755489","https://openalex.org/W2404938947","https://openalex.org/W2511310340","https://openalex.org/W2609527102","https://openalex.org/W2791062765","https://openalex.org/W3134969951","https://openalex.org/W4231109964","https://openalex.org/W4301383669","https://openalex.org/W6679718588","https://openalex.org/W6713805741"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W4312417841","https://openalex.org/W3193565141","https://openalex.org/W3133861977","https://openalex.org/W3167935049","https://openalex.org/W3029198973","https://openalex.org/W2077021924"],"abstract_inverted_index":{"In":[0],"the":[1,20,83,109,114,117,138],"last":[2],"few":[3],"decades,":[4],"Deep":[5,25],"Neural":[6,27,61],"Networks":[7],"(DNNs)":[8],"has":[9],"shown":[10],"outstanding":[11],"performance":[12,131],"in":[13,46,75,120],"speech":[14,47,76],"recognition":[15,145],"applications.":[16],"We":[17,112],"demonstrate":[18],"that":[19,127],"improved":[21],"accuracy":[22],"obtained":[23],"by":[24],"Convolutional":[26,60],"Network":[28,62],"(DCNN)":[29],"arose":[30],"from":[31],"their":[32],"capacity":[33],"to":[34,41,65,81,107],"extract":[35],"discriminative":[36],"representations":[37],"which":[38],"are":[39,101],"robust":[40],"various":[42],"sources":[43],"of":[44,73,116,144],"variability":[45],"signals.":[48],"By":[49],"this":[50],"study,":[51],"we":[52],"propose":[53],"a":[54],"new":[55],"algorithm,":[56],"named":[57],"Scattering":[58],"Transform-Deep":[59],"CNN:":[63],"ST-DCNN":[64],"identify":[66],"normal":[67],"and":[68,135],"pathological":[69,88],"voices.":[70],"The":[71,91,123],"effectiveness":[72],"advances":[74],"features":[77,100],"have":[78],"been":[79],"proven":[80],"be":[82],"root":[84],"for":[85],"an":[86],"efficient":[87],"voices":[89,110],"classification.":[90],"proposed":[92,118],"algorithm":[93],"involved":[94],"two":[95],"stages:":[96],"First,":[97],"scatter":[98],"wavelet":[99,134],"extracted.":[102],"Then,":[103],"DCNN":[104,136],"is":[105],"used":[106],"classify":[108],"samples.":[111],"evaluated":[113],"robustness":[115],"system":[119],"silent":[121],"environments.":[122],"experimental":[124],"results":[125],"indicates":[126],"it":[128],"achieves":[129],"better":[130],"with":[132,137],"scattering":[133],"clean":[139],"data":[140],"within":[141],"99.62":[142],"%":[143],"rate.":[146]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
