{"id":"https://openalex.org/W2100375615","doi":"https://doi.org/10.1109/icassp.2011.5946442","title":"Audio signal classification with temporal envelopes","display_name":"Audio signal classification with temporal envelopes","publication_year":2011,"publication_date":"2011-05-01","ids":{"openalex":"https://openalex.org/W2100375615","doi":"https://doi.org/10.1109/icassp.2011.5946442","mag":"2100375615"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2011.5946442","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5946442","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113349806","display_name":"M. Umair Bin Altaf","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"M Umair Bin Altaf","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","School of Electrical & Computer Engineering, Georgia Institute of Technology, Atlanta 30332, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical & Computer Engineering, Georgia Institute of Technology, Atlanta 30332, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070867959","display_name":"Biing\u2010Hwang Juang","orcid":"https://orcid.org/0000-0002-5773-5679"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Biing-Hwang Juang","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","School of Electrical & Computer Engineering, Georgia Institute of Technology, Atlanta 30332, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical & Computer Engineering, Georgia Institute of Technology, Atlanta 30332, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5113349806"],"corresponding_institution_ids":["https://openalex.org/I130701444"],"apc_list":null,"apc_paid":null,"fwci":0.2748,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.57894165,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"469","last_page":"472"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.707334041595459},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6792634725570679},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.6312376260757446},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.623080849647522},{"id":"https://openalex.org/keywords/spectral-envelope","display_name":"Spectral envelope","score":0.6124239563941956},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.607266366481781},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.6007227897644043},{"id":"https://openalex.org/keywords/envelope","display_name":"Envelope (radar)","score":0.583268940448761},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.5134421586990356},{"id":"https://openalex.org/keywords/time\u2013frequency-analysis","display_name":"Time\u2013frequency analysis","score":0.501145601272583},{"id":"https://openalex.org/keywords/spectral-density","display_name":"Spectral density","score":0.485825777053833},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.4856623411178589},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.44147688150405884},{"id":"https://openalex.org/keywords/audio-analyzer","display_name":"Audio analyzer","score":0.4269216060638428},{"id":"https://openalex.org/keywords/audio-signal-flow","display_name":"Audio signal flow","score":0.426284521818161},{"id":"https://openalex.org/keywords/multidimensional-signal-processing","display_name":"Multidimensional signal processing","score":0.41183120012283325},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36354494094848633},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.35070037841796875},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.18152570724487305},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.1427980363368988},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.10506623983383179}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.707334041595459},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6792634725570679},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.6312376260757446},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.623080849647522},{"id":"https://openalex.org/C54926389","wikidata":"https://www.wikidata.org/wiki/Q7575188","display_name":"Spectral envelope","level":2,"score":0.6124239563941956},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.607266366481781},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.6007227897644043},{"id":"https://openalex.org/C65155139","wikidata":"https://www.wikidata.org/wiki/Q5380912","display_name":"Envelope (radar)","level":3,"score":0.583268940448761},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.5134421586990356},{"id":"https://openalex.org/C142433447","wikidata":"https://www.wikidata.org/wiki/Q7806653","display_name":"Time\u2013frequency analysis","level":3,"score":0.501145601272583},{"id":"https://openalex.org/C168110828","wikidata":"https://www.wikidata.org/wiki/Q1331626","display_name":"Spectral density","level":2,"score":0.485825777053833},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.4856623411178589},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.44147688150405884},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.4269216060638428},{"id":"https://openalex.org/C167940747","wikidata":"https://www.wikidata.org/wiki/Q63727227","display_name":"Audio signal flow","level":5,"score":0.426284521818161},{"id":"https://openalex.org/C501101116","wikidata":"https://www.wikidata.org/wiki/Q18378116","display_name":"Multidimensional signal processing","level":4,"score":0.41183120012283325},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36354494094848633},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.35070037841796875},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.18152570724487305},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.1427980363368988},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.10506623983383179},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2011.5946442","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5946442","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W101319899","https://openalex.org/W1968707255","https://openalex.org/W1973746598","https://openalex.org/W1974932989","https://openalex.org/W2013020033","https://openalex.org/W2022349254","https://openalex.org/W2087596342","https://openalex.org/W2090135651","https://openalex.org/W2105595944","https://openalex.org/W2114537326","https://openalex.org/W2122832694","https://openalex.org/W2126617887","https://openalex.org/W2139731495","https://openalex.org/W2148734646","https://openalex.org/W2153220212","https://openalex.org/W2175659613"],"related_works":["https://openalex.org/W2098934641","https://openalex.org/W4387698063","https://openalex.org/W2363106653","https://openalex.org/W2019256813","https://openalex.org/W1975359510","https://openalex.org/W2103045678","https://openalex.org/W4214771044","https://openalex.org/W2494533082","https://openalex.org/W4382560817","https://openalex.org/W3110605476"],"abstract_inverted_index":{"The":[0],"conventional":[1],"approach":[2],"to":[3,19,51,60,63,87],"audio":[4,21,43,67],"processing,":[5],"based":[6],"on":[7],"the":[8,36,42,46,78,88],"short-time":[9],"power":[10],"spectrum":[11],"model,":[12],"is":[13,57,85],"not":[14],"adequate":[15],"when":[16,83],"it":[17,72],"comes":[18],"general":[20],"signals.":[22],"We":[23,69],"propose":[24],"an":[25,53],"approach,":[26],"justified":[27],"by":[28],"studies":[29],"from":[30,47],"psycho-acoustics":[31],"and":[32,38],"neuroimaging,":[33],"which":[34,56,80],"uses":[35],"magnitude":[37],"frequency":[39],"envelope":[40],"of":[41,48,77],"signal":[44,79],"in":[45],"AM-FM":[49],"modulations":[50],"build":[52],"ARMA":[54],"model":[55],"then":[58],"fed":[59],"a":[61],"GMM":[62],"classify":[64],"into":[65],"various":[66],"classes.":[68],"show":[70],"that":[71],"makes":[73],"explicit":[74],"certain":[75],"aspects":[76],"are":[81],"overlooked":[82],"processing":[84],"limited":[86],"spectral":[89],"domain.":[90]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
