{"id":"https://openalex.org/W3213334936","doi":"https://doi.org/10.1109/icccnt51525.2021.9579778","title":"Deep learning based urban sound classification and ambulance siren detector using spectrogram","display_name":"Deep learning based urban sound classification and ambulance siren detector using spectrogram","publication_year":2021,"publication_date":"2021-07-06","ids":{"openalex":"https://openalex.org/W3213334936","doi":"https://doi.org/10.1109/icccnt51525.2021.9579778","mag":"3213334936"},"language":"en","primary_location":{"id":"doi:10.1109/icccnt51525.2021.9579778","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt51525.2021.9579778","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 12th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064504769","display_name":"Dipro Pramanick","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Dipro Pramanick","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050086317","display_name":"Haaris Ansar","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Haaris Ansar","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055314482","display_name":"Hemant Kumar","orcid":"https://orcid.org/0000-0003-0603-4394"},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Hemant Kumar","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110945856","display_name":"S Pranav","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S Pranav","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048995399","display_name":"Richa Tengshe","orcid":"https://orcid.org/0000-0003-0050-3102"},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Richa Tengshe","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046768133","display_name":"Binish Fatimah","orcid":"https://orcid.org/0000-0002-6115-1561"},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Binish Fatimah","raw_affiliation_strings":["CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037"],"affiliations":[{"raw_affiliation_string":"CMR Institute of Technology,Department of Electronics and Communication Engineering,Bangalore,Karnataka,India,560037","institution_ids":["https://openalex.org/I4210104573"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064504769"],"corresponding_institution_ids":["https://openalex.org/I4210104573"],"apc_list":null,"apc_paid":null,"fwci":1.2189,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.79763354,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/siren","display_name":"Siren (mythology)","score":0.9370377659797668},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.8417161703109741},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6501463055610657},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.6078097820281982},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.5227620601654053},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5166094899177551},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.47932469844818115},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.46168652176856995},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.4570815861225128},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43886882066726685},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4299437701702118},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.37656158208847046},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3367788791656494},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.2416735589504242},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2044963836669922},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.16018056869506836},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.13339802622795105}],"concepts":[{"id":"https://openalex.org/C160844653","wikidata":"https://www.wikidata.org/wiki/Q150986","display_name":"Siren (mythology)","level":2,"score":0.9370377659797668},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.8417161703109741},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6501463055610657},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.6078097820281982},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.5227620601654053},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5166094899177551},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.47932469844818115},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.46168652176856995},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.4570815861225128},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43886882066726685},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4299437701702118},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.37656158208847046},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3367788791656494},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.2416735589504242},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2044963836669922},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.16018056869506836},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.13339802622795105},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icccnt51525.2021.9579778","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt51525.2021.9579778","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 12th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.8600000143051147}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1430048851","https://openalex.org/W1964131130","https://openalex.org/W2031377442","https://openalex.org/W2038484192","https://openalex.org/W2135342008","https://openalex.org/W2171775068","https://openalex.org/W2191779130","https://openalex.org/W2258245936","https://openalex.org/W2588866295","https://openalex.org/W2751841560","https://openalex.org/W2796101164","https://openalex.org/W2888469011","https://openalex.org/W2889309940","https://openalex.org/W2891437363","https://openalex.org/W2902444285","https://openalex.org/W2909327627","https://openalex.org/W2964141725","https://openalex.org/W2973284423","https://openalex.org/W2990387791","https://openalex.org/W2995673094","https://openalex.org/W3013071107","https://openalex.org/W3021992411","https://openalex.org/W3030241088","https://openalex.org/W3082045506","https://openalex.org/W3082401322","https://openalex.org/W3082878506","https://openalex.org/W3094591342","https://openalex.org/W3095348033","https://openalex.org/W3102382472","https://openalex.org/W3106722373","https://openalex.org/W3131886871","https://openalex.org/W3157065363","https://openalex.org/W3160238633","https://openalex.org/W6754446152","https://openalex.org/W6786287574"],"related_works":["https://openalex.org/W2762764793","https://openalex.org/W2549936067","https://openalex.org/W2325061356","https://openalex.org/W2378218812","https://openalex.org/W2549439819","https://openalex.org/W2733934953","https://openalex.org/W2036202717","https://openalex.org/W1996448601","https://openalex.org/W1805378716","https://openalex.org/W2966307288"],"abstract_inverted_index":{"An":[0,22],"efficient":[1,42],"sound":[2,33,52,56,99],"classification":[3,53],"algorithm":[4,91],"can":[5],"benefit":[6],"a":[7,35,102],"multitude":[8],"of":[9,69,77,88,117],"applications":[10],"involving":[11],"home,":[12],"wildlife,":[13],"and":[14,28,43,50,64,71,101,123],"residential":[15],"surveillance,":[16],"traffic":[17],"regulation,":[18],"medical":[19],"monitoring":[20],"etc.":[21],"important":[23],"application":[24],"is":[25,84,92],"to":[26,57],"identify":[27],"notify":[29],"the":[30,75,78,89,120,126],"ambulance":[31,107],"siren":[32,48,108],"amidst":[34],"noisy":[36],"environment.":[37],"This":[38],"work":[39],"develops":[40],"an":[41,115],"less":[44],"complex":[45],"architecture":[46,80],"for":[47,97,106,119,125],"detection":[49],"urban":[51,98],"using":[54],"different":[55],"image":[58],"transformation":[59],"methods":[60],"viz:":[61],"Mel-spectrogram,":[62],"Scalogram":[63],"Fourier":[65],"decomposition":[66],"method(FDM).":[67],"Effects":[68],"augmentation":[70],"pre-processing":[72],"techniques":[73],"on":[74,94],"efficacy":[76],"developed":[79],"against":[81],"pre-trained":[82],"models":[83],"analyzed.":[85],"The":[86,110],"performance":[87],"proposed":[90,112],"tested":[93],"Urbansound8K":[95],"dataset":[96,105],"classification,":[100],"multi":[103],"-source":[104],"detector.":[109],"CNN":[111],"here":[113],"gives":[114],"accuracy":[116],"89.66%":[118],"former":[121],"case":[122],"99.35%":[124],"latter.":[127]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
