{"id":"https://openalex.org/W2066201752","doi":"https://doi.org/10.1109/icdsp.2014.6900815","title":"Audio surveillance under noisy conditions using time-frequency image feature","display_name":"Audio surveillance under noisy conditions using time-frequency image feature","publication_year":2014,"publication_date":"2014-08-01","ids":{"openalex":"https://openalex.org/W2066201752","doi":"https://doi.org/10.1109/icdsp.2014.6900815","mag":"2066201752"},"language":"en","primary_location":{"id":"doi:10.1109/icdsp.2014.6900815","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdsp.2014.6900815","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 19th International Conference on Digital Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023279352","display_name":"Roneel V. Sharan","orcid":"https://orcid.org/0000-0003-1079-8709"},"institutions":[{"id":"https://openalex.org/I39854758","display_name":"Auckland University of Technology","ror":"https://ror.org/01zvqw119","country_code":"NZ","type":"education","lineage":["https://openalex.org/I39854758"]}],"countries":["NZ"],"is_corresponding":true,"raw_author_name":"Roneel V. Sharan","raw_affiliation_strings":["School of Engineering, Auckland University of Technology, Auckland, New Zealand","School of Engineering, Auckland University of Technology, Private Bag 92006, Auckland 1142, New Zealand"],"affiliations":[{"raw_affiliation_string":"School of Engineering, Auckland University of Technology, Auckland, New Zealand","institution_ids":["https://openalex.org/I39854758"]},{"raw_affiliation_string":"School of Engineering, Auckland University of Technology, Private Bag 92006, Auckland 1142, New Zealand","institution_ids":["https://openalex.org/I39854758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044116630","display_name":"T.J. Moir","orcid":"https://orcid.org/0000-0002-4291-6143"},"institutions":[{"id":"https://openalex.org/I39854758","display_name":"Auckland University of Technology","ror":"https://ror.org/01zvqw119","country_code":"NZ","type":"education","lineage":["https://openalex.org/I39854758"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Tom J. Moir","raw_affiliation_strings":["School of Engineering, Auckland University of Technology, Auckland, New Zealand","School of Engineering, Auckland University of Technology, Private Bag 92006, Auckland 1142, New Zealand"],"affiliations":[{"raw_affiliation_string":"School of Engineering, Auckland University of Technology, Auckland, New Zealand","institution_ids":["https://openalex.org/I39854758"]},{"raw_affiliation_string":"School of Engineering, Auckland University of Technology, Private Bag 92006, Auckland 1142, New Zealand","institution_ids":["https://openalex.org/I39854758"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5023279352"],"corresponding_institution_ids":["https://openalex.org/I39854758"],"apc_list":null,"apc_paid":null,"fwci":0.8734,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.74839419,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"130","last_page":"135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grayscale","display_name":"Grayscale","score":0.8705167770385742},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.7339242100715637},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7109990119934082},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5865170359611511},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5714966058731079},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48874950408935547},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4691796600818634},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.37463003396987915},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.2908463180065155},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.24744468927383423}],"concepts":[{"id":"https://openalex.org/C78201319","wikidata":"https://www.wikidata.org/wiki/Q685727","display_name":"Grayscale","level":3,"score":0.8705167770385742},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7339242100715637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7109990119934082},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5865170359611511},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5714966058731079},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48874950408935547},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4691796600818634},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37463003396987915},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.2908463180065155},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.24744468927383423},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdsp.2014.6900815","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdsp.2014.6900815","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 19th International Conference on Digital Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1560641100","https://openalex.org/W1593093587","https://openalex.org/W1974387177","https://openalex.org/W2059432853","https://openalex.org/W2090431713","https://openalex.org/W2101626343","https://openalex.org/W2113278353","https://openalex.org/W2114486803","https://openalex.org/W2121961612","https://openalex.org/W2130640900","https://openalex.org/W2153104898","https://openalex.org/W2157239837","https://openalex.org/W2159957507","https://openalex.org/W2168228682","https://openalex.org/W2168441989","https://openalex.org/W2170355566","https://openalex.org/W2245569228","https://openalex.org/W4254721730","https://openalex.org/W4312326823","https://openalex.org/W6633570323","https://openalex.org/W6678381582","https://openalex.org/W6683380652","https://openalex.org/W6690610466"],"related_works":["https://openalex.org/W115686965","https://openalex.org/W2768918307","https://openalex.org/W2040020606","https://openalex.org/W2110031805","https://openalex.org/W2591697403","https://openalex.org/W4362659915","https://openalex.org/W2953716828","https://openalex.org/W2904857019","https://openalex.org/W2113071088","https://openalex.org/W2359610660"],"abstract_inverted_index":{"In":[0,26],"this":[1],"paper,":[2],"we":[3,28,90],"use":[4],"the":[5,13,56,70,74,81,95,135,138,151],"novel":[6],"method":[7],"of":[8,17,55,60,80,94],"using":[9,127,164],"features":[10,169],"extracted":[11],"from":[12],"time-frequency":[14],"image":[15,31,84,101,141,154],"representation":[16],"a":[18,41,49,86,172],"sound":[19,42,178],"signal":[20,43],"in":[21,112,176],"an":[22],"audio":[23],"surveillance":[24],"application.":[25],"particular,":[27],"investigate":[29],"two":[30],"representations:":[32],"linear":[33,75,139],"grayscale":[34,76,83,140,153],"and":[35,47,66,107,123],"log":[36,82,92,152],"grayscale.":[37],"We":[38,115],"first":[39],"divide":[40],"into":[44,105],"smaller":[45],"frames":[46],"apply":[48],"windowing":[50],"function.":[51],"The":[52,78],"absolute":[53],"value":[54],"Discrete":[57],"Fourier":[58],"Transform":[59],"each":[61,113],"frame":[62],"is":[63,102,143,171],"then":[64,103],"computed":[65,111],"normalized":[67],"to":[68,145,160],"get":[69],"intensity":[71],"values":[72,96],"for":[73,131],"image.":[77],"generation":[79],"takes":[85],"similar":[87],"approach":[88,142],"but":[89],"take":[91],"power":[93],"before":[97],"data":[98],"normalization.":[99],"Each":[100],"divided":[104],"blocks":[106],"central":[108],"moments":[109],"are":[110],"block.":[114],"carry":[116],"out":[117],"experimentation":[118],"under":[119],"different":[120],"noise":[121,148],"conditions":[122],"varying":[124],"signal-to-noise":[125],"ratio":[126],"support":[128],"vector":[129],"machines":[130],"classification.":[132],"Based":[133],"on":[134],"classification":[136],"accuracy,":[137],"found":[144,159],"be":[146],"more":[147],"robust":[149],"than":[150,163],"approach.":[155],"It":[156],"was":[157],"also":[158],"perform":[161],"better":[162],"mel-frequency":[165],"cepstral":[166],"coefficients":[167],"as":[168],"which":[170],"common":[173],"baseline":[174],"feature":[175],"most":[177],"recognition":[179],"applications.":[180]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
