{"id":"https://openalex.org/W4386754713","doi":"https://doi.org/10.1007/s10772-023-10042-z","title":"Time frequency domain deep CNN for automatic background classification in speech signals","display_name":"Time frequency domain deep CNN for automatic background classification in speech signals","publication_year":2023,"publication_date":"2023-09-01","ids":{"openalex":"https://openalex.org/W4386754713","doi":"https://doi.org/10.1007/s10772-023-10042-z"},"language":"en","primary_location":{"id":"doi:10.1007/s10772-023-10042-z","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s10772-023-10042-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10772-023-10042-z.pdf","source":{"id":"https://openalex.org/S4650632","display_name":"International Journal of Speech Technology","issn_l":"1381-2416","issn":["1381-2416","1572-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Speech Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10772-023-10042-z.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041082402","display_name":"Rakesh Reddy Yakkati","orcid":"https://orcid.org/0000-0003-4358-7262"},"institutions":[{"id":"https://openalex.org/I115715567","display_name":"Birla Institute of Technology, Mesra","ror":"https://ror.org/028vtqb15","country_code":"IN","type":"education","lineage":["https://openalex.org/I115715567"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rakesh Reddy Yakkati","raw_affiliation_strings":["Department of Mathematics, Birla Institute of Technology, Mesra, Jharkhand, 835215, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Mathematics, Birla Institute of Technology, Mesra, Jharkhand, 835215, India","institution_ids":["https://openalex.org/I115715567"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000928969","display_name":"Sreenivasa Reddy Yeduri","orcid":null},"institutions":[{"id":"https://openalex.org/I200650556","display_name":"University of Agder","ror":"https://ror.org/03x297z98","country_code":"NO","type":"education","lineage":["https://openalex.org/I200650556"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Sreenivasa Reddy Yeduri","raw_affiliation_strings":["Department of Information and Communication Technology, University of Agder, Grimstad, Norway"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information and Communication Technology, University of Agder, Grimstad, Norway","institution_ids":["https://openalex.org/I200650556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003313501","display_name":"Rajesh Kumar Tripathy","orcid":"https://orcid.org/0000-0003-2517-3103"},"institutions":[{"id":"https://openalex.org/I4210101034","display_name":"Birla Institute of Technology and Science - Hyderabad Campus","ror":"https://ror.org/014ctt859","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210101034","https://openalex.org/I74796645"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rajesh Kumar Tripathy","raw_affiliation_strings":["Department of Electrical and Electronic Engineering, Birla Institute of Technology, Hyderabad, Telangana, 500078, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronic Engineering, Birla Institute of Technology, Hyderabad, Telangana, 500078, India","institution_ids":["https://openalex.org/I4210101034"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014288820","display_name":"Linga Reddy Cenkeramaddi","orcid":"https://orcid.org/0000-0002-1023-2118"},"institutions":[{"id":"https://openalex.org/I200650556","display_name":"University of Agder","ror":"https://ror.org/03x297z98","country_code":"NO","type":"education","lineage":["https://openalex.org/I200650556"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Linga Reddy Cenkeramaddi","raw_affiliation_strings":["Department of Information and Communication Technology, University of Agder, Grimstad, Norway"],"raw_orcid":"https://orcid.org/0000-0002-1023-2118","affiliations":[{"raw_affiliation_string":"Department of Information and Communication Technology, University of Agder, Grimstad, Norway","institution_ids":["https://openalex.org/I200650556"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5041082402"],"corresponding_institution_ids":["https://openalex.org/I115715567"],"apc_list":{"value":2190,"currency":"EUR","value_usd":2780},"apc_paid":{"value":2190,"currency":"EUR","value_usd":2780},"fwci":0.3838,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.56477871,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"26","issue":"3","first_page":"695","last_page":"706"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8900023698806763},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6134647130966187},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.5665478706359863},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5202694535255432},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5018317699432373},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48612308502197266},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.428035169839859},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42691996693611145},{"id":"https://openalex.org/keywords/wavelet","display_name":"Wavelet","score":0.4113408625125885},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4052669107913971}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8900023698806763},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6134647130966187},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.5665478706359863},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5202694535255432},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5018317699432373},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48612308502197266},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.428035169839859},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42691996693611145},{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.4113408625125885},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4052669107913971},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10772-023-10042-z","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s10772-023-10042-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10772-023-10042-z.pdf","source":{"id":"https://openalex.org/S4650632","display_name":"International Journal of Speech Technology","issn_l":"1381-2416","issn":["1381-2416","1572-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Speech Technology","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10772-023-10042-z","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1007/s10772-023-10042-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10772-023-10042-z.pdf","source":{"id":"https://openalex.org/S4650632","display_name":"International Journal of Speech Technology","issn_l":"1381-2416","issn":["1381-2416","1572-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Speech Technology","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8299999833106995,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G3320310129","display_name":null,"funder_award_id":"280835","funder_id":"https://openalex.org/F4320323299","funder_display_name":"Norges Forskningsr\u00e5d"},{"id":"https://openalex.org/G7618422984","display_name":null,"funder_award_id":"287918","funder_id":"https://openalex.org/F4320323299","funder_display_name":"Norges Forskningsr\u00e5d"}],"funders":[{"id":"https://openalex.org/F4320323299","display_name":"Norges Forskningsr\u00e5d","ror":"https://ror.org/00epmv149"},{"id":"https://openalex.org/F4320327751","display_name":"Universitetet i Agder","ror":"https://ror.org/03x297z98"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4386754713.pdf"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W1178673422","https://openalex.org/W1966976522","https://openalex.org/W1973399263","https://openalex.org/W1975572074","https://openalex.org/W1983963761","https://openalex.org/W2052666245","https://openalex.org/W2078564204","https://openalex.org/W2090218979","https://openalex.org/W2127737460","https://openalex.org/W2130813098","https://openalex.org/W2151484683","https://openalex.org/W2571764252","https://openalex.org/W2617002574","https://openalex.org/W2678442846","https://openalex.org/W2889495646","https://openalex.org/W2903926094","https://openalex.org/W2962680212","https://openalex.org/W2990035072","https://openalex.org/W3001387854","https://openalex.org/W3005348841","https://openalex.org/W3033761581","https://openalex.org/W3046118769","https://openalex.org/W3113043802","https://openalex.org/W3133500314","https://openalex.org/W3157740661","https://openalex.org/W3200430820","https://openalex.org/W4289336416"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W2900413183","https://openalex.org/W4390975304","https://openalex.org/W147410782","https://openalex.org/W3022252430","https://openalex.org/W3103989898","https://openalex.org/W4287804464","https://openalex.org/W2810679507","https://openalex.org/W2059040236"],"abstract_inverted_index":{"Abstract":[0],"Many":[1],"application":[2],"areas,":[3],"such":[4,146],"as":[5,147],"background":[6,33,44,70,104,140,181],"identification,":[7],"predictive":[8],"maintenance":[9],"in":[10,64,73,107,143,184],"industrial":[11],"applications,":[12,15],"smart":[13],"home":[14],"assisting":[16],"deaf":[17],"people":[18],"with":[19],"their":[20],"daily":[21],"activities":[22],"and":[23,25,128,158],"indexing":[24],"retrieval":[26],"of":[27,115,175,190],"content-based":[28],"multimedia,":[29],"etc.,":[30],"use":[31],"automatic":[32],"classification":[34,173],"using":[35,138],"speech":[36,48,74,87,108,144,185],"signals.":[37,75,88,109,186],"It":[38],"is":[39,62,78,136,194],"challenging":[40],"to":[41,80,95,102,162,179,196],"predict":[42],"the":[43,82,86,163,165,188,191,197],"environment":[45],"accurately":[46],"from":[47,85],"signal":[49],"information.":[50],"Thus,":[51],"a":[52,96],"novel":[53],"synchrosqueezed":[54],"wavelet":[55],"transform":[56],"(SWT)-based":[57],"deep":[58,97],"learning":[59],"(DL)":[60],"approach":[61,169,193],"proposed":[63,111,134,166,192],"this":[65],"paper":[66],"for":[67],"automatically":[68],"classifying":[69],"information":[71,105,182],"embedded":[72,106,142,183],"Here,":[76],"SWT":[77],"incorporated":[79],"obtain":[81],"time-frequency":[83,90],"plot":[84],"These":[89],"signals":[91,141],"are":[92],"then":[93],"fed":[94],"convolutional":[98],"neural":[99],"network":[100],"(DCNN)":[101],"classify":[103,180],"The":[110,133],"DCNN":[112,168],"model":[113],"consists":[114],"three":[116,122],"convolution":[117],"layers,":[118,124],"one":[119,125,129],"batch-normalization":[120],"layer,":[121,127],"max-pooling":[123],"dropout":[126],"fully":[130],"connected":[131],"layer.":[132],"method":[135],"tested":[137],"various":[139],"signals,":[145],"airport,":[148],"airplane,":[149],"drone,":[150],"street,":[151],"babble,":[152],"car,":[153],"helicopter,":[154],"exhibition,":[155],"station,":[156],"restaurant,":[157],"train":[159],"sounds.":[160],"According":[161],"results,":[164],"SWT-based":[167],"has":[170],"an":[171],"overall":[172],"accuracy":[174],"97.96":[176],"(\u00b1":[177],"0.53)%":[178],"Finally,":[187],"performance":[189],"compared":[195],"existing":[198],"methods.":[199]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
