{"id":"https://openalex.org/W2004453603","doi":"https://doi.org/10.1109/taslp.2014.2367821","title":"Inversion of auditory spectrograms, traditional spectrograms, and other envelope representations","display_name":"Inversion of auditory spectrograms, traditional spectrograms, and other envelope representations","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2004453603","doi":"https://doi.org/10.1109/taslp.2014.2367821","mag":"2004453603"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2014.2367821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2014.2367821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/7010069/06949659.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/6570655/7010069/06949659.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045215979","display_name":"Remi Julien Blaise Decorsi\u00e8re","orcid":null},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Remi Decorsiere","raw_affiliation_strings":["Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084033010","display_name":"Peter S\u00f8ndergaard","orcid":"https://orcid.org/0000-0002-0964-9776"},"institutions":[{"id":"https://openalex.org/I4210130492","display_name":"Oticon Medical (Denmark)","ror":"https://ror.org/03c5ds320","country_code":"DK","type":"company","lineage":["https://openalex.org/I4210130492"]},{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Peter Sondergaard","raw_affiliation_strings":["Senior R&D Engineer with Oticon A/S, Sm\u00f8rum, Denmark","Center for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Senior R&D Engineer with Oticon A/S, Sm\u00f8rum, Denmark","institution_ids":["https://openalex.org/I4210130492"]},{"raw_affiliation_string":"Center for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054678574","display_name":"Ewen MacDonald","orcid":"https://orcid.org/0000-0002-6973-2926"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Ewen MacDonald","raw_affiliation_strings":["Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046255570","display_name":"Torsten Dau","orcid":"https://orcid.org/0000-0001-8110-4343"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Torsten Dau","raw_affiliation_strings":["Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark"],"affiliations":[{"raw_affiliation_string":"Centre for Applied Hearing Research, Technical University of Denmark, Kongens Lyngby, Denmark","institution_ids":["https://openalex.org/I96673099"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5045215979"],"corresponding_institution_ids":["https://openalex.org/I96673099"],"apc_list":null,"apc_paid":null,"fwci":0.9405,"has_fulltext":true,"cited_by_count":24,"citation_normalized_percentile":{"value":0.73025654,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.9696987867355347},{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.6465155482292175},{"id":"https://openalex.org/keywords/envelope","display_name":"Envelope (radar)","score":0.5584387183189392},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4171249270439148},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.3929433822631836},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3872770369052887},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.314192533493042},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.2423078417778015},{"id":"https://openalex.org/keywords/seismology","display_name":"Seismology","score":0.2121703326702118},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.10766139626502991}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.9696987867355347},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.6465155482292175},{"id":"https://openalex.org/C65155139","wikidata":"https://www.wikidata.org/wiki/Q5380912","display_name":"Envelope (radar)","level":3,"score":0.5584387183189392},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4171249270439148},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.3929433822631836},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3872770369052887},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.314192533493042},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.2423078417778015},{"id":"https://openalex.org/C165205528","wikidata":"https://www.wikidata.org/wiki/Q83371","display_name":"Seismology","level":1,"score":0.2121703326702118},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10766139626502991},{"id":"https://openalex.org/C77928131","wikidata":"https://www.wikidata.org/wiki/Q193343","display_name":"Tectonics","level":2,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2014.2367821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2014.2367821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/7010069/06949659.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:publications/2338f310-194d-49f9-85dd-1e87ea3760fd","is_oa":true,"landing_page_url":"https://orbit.dtu.dk/en/publications/2338f310-194d-49f9-85dd-1e87ea3760fd","pdf_url":null,"source":{"id":"https://openalex.org/S4306400705","display_name":"Technical University of Denmark, DTU Orbit (Technical University of Denmark, DTU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I96673099","host_organization_name":"Technical University of Denmark","host_organization_lineage":["https://openalex.org/I96673099"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Decorsi\u00e8re , R J B , S\u00f8ndergaard , P L , MacDonald , E &amp; Dau , T 2015 , ' Inversion of Auditory Spectrograms, Traditional Spectrograms, and Other Envelope Representations ' , I E E E Transactions on Audio, Speech and Language Processing , vol. 23 , no. 1 , pp. 46-56 .","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/taslp.2014.2367821","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2014.2367821","pdf_url":"https://ieeexplore.ieee.org/ielx7/6570655/7010069/06949659.pdf","source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2004453603.pdf","grobid_xml":"https://content.openalex.org/works/W2004453603.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W166394536","https://openalex.org/W1511414143","https://openalex.org/W1545406001","https://openalex.org/W1974778974","https://openalex.org/W1974932989","https://openalex.org/W1987831012","https://openalex.org/W2028138004","https://openalex.org/W2028923004","https://openalex.org/W2029654180","https://openalex.org/W2041777218","https://openalex.org/W2050758723","https://openalex.org/W2051434435","https://openalex.org/W2054139811","https://openalex.org/W2059744545","https://openalex.org/W2061249192","https://openalex.org/W2065691163","https://openalex.org/W2090135651","https://openalex.org/W2095992616","https://openalex.org/W2107535961","https://openalex.org/W2120847449","https://openalex.org/W2159271068","https://openalex.org/W2159300614","https://openalex.org/W2167850383","https://openalex.org/W2401387233","https://openalex.org/W2556247670","https://openalex.org/W2600596419","https://openalex.org/W2741913599","https://openalex.org/W2964084773","https://openalex.org/W4244253603","https://openalex.org/W6606689292","https://openalex.org/W6630600482","https://openalex.org/W6632590417"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W4375868962","https://openalex.org/W2011227383","https://openalex.org/W2088854863","https://openalex.org/W4402568167","https://openalex.org/W2942893872","https://openalex.org/W3179495260","https://openalex.org/W1976719989","https://openalex.org/W2897924318","https://openalex.org/W2138997758"],"abstract_inverted_index":{"Envelope":[0],"representations":[1],"such":[2],"as":[3],"the":[4,13,18,30,36,63,72,97,102,105,114,125,143,161,164,177],"auditory":[5,94,141],"or":[6,33,44],"traditional":[7,157,189],"spectrogram":[8],"can":[9,137],"be":[10],"defined":[11],"by":[12,169],"set":[14],"of":[15,20,35,81,88,104,116,163,172,188],"envelopes":[16],"from":[17],"outputs":[19],"a":[21,46,58,75,82,128,174,184],"filterbank.":[22],"Common":[23],"envelope":[24,52,77,109],"extraction":[25,110],"methods":[26],"discard":[27],"information":[28],"regarding":[29],"fast":[31],"fluctuations,":[32],"phase,":[34],"signal.":[37,85],"Thus,":[38],"it":[39],"is":[40,66,99,111,122,127,132,154,179],"difficult":[41],"to":[42,156,176,183],"invert,":[43],"reconstruct":[45],"time-domain":[47,84,149],"signal":[48],"from,":[49],"an":[50,140],"arbitrary":[51],"representation.":[53],"To":[54],"address":[55],"this":[56,89],"problem,":[57],"general":[59],"optimization":[60],"approach":[61,130,145],"in":[62],"time":[64],"domain":[65],"proposed":[67],"here,":[68],"which":[69,181],"iteratively":[70],"minimizes":[71],"distance":[73],"between":[74],"target":[76],"representation":[78],"and":[79,108],"that":[80,131],"reconstructed":[83],"Two":[86],"implementations":[87],"framework":[90,153,178],"are":[91],"presented":[92],"for":[93],"spectrograms,":[95],"where":[96],"filterbank":[98],"based":[100,159],"on":[101,113,148,160],"behavior":[103],"basilar":[106],"membrane":[107],"modeled":[112],"response":[115],"inner":[117],"hair":[118],"cells.":[119],"One":[120],"implementation":[121],"direct":[123],"while":[124],"other":[126],"two-stage":[129,144],"computationally":[133],"simpler.":[134],"While":[135],"both":[136],"accurately":[138],"invert":[139],"spectrogram,":[142],"performs":[146],"better":[147],"metrics.":[150],"The":[151],"same":[152],"applied":[155],"spectrograms":[158],"magnitude":[162],"short-time":[165],"Fourier":[166],"transform.":[167],"Inspired":[168],"human":[170],"perception":[171],"loudness,":[173],"modification":[175],"proposed,":[180],"leads":[182],"more":[185],"accurate":[186],"inversion":[187],"spectrograms.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":6},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
