{"id":"https://openalex.org/W2874689226","doi":"https://doi.org/10.1109/iwaenc.2018.8521313","title":"Phase Reconstruction from Amplitude Spectrograms Based on Von-Mises-Distribution Deep Neural Network","display_name":"Phase Reconstruction from Amplitude Spectrograms Based on Von-Mises-Distribution Deep Neural Network","publication_year":2018,"publication_date":"2018-09-01","ids":{"openalex":"https://openalex.org/W2874689226","doi":"https://doi.org/10.1109/iwaenc.2018.8521313","mag":"2874689226"},"language":"en","primary_location":{"id":"doi:10.1109/iwaenc.2018.8521313","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwaenc.2018.8521313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 16th International Workshop on Acoustic Signal Enhancement (IWAENC)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013050263","display_name":"Shinnosuke Takamichi","orcid":"https://orcid.org/0000-0003-0520-7847"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Shinnosuke Takamichi","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083394213","display_name":"Yuki Saito","orcid":"https://orcid.org/0000-0002-7967-2613"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuki Saito","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051506797","display_name":"Norihiro Takamune","orcid":"https://orcid.org/0000-0002-8102-3110"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Norihiro Takamune","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071479017","display_name":"Daichi Kitamura","orcid":"https://orcid.org/0000-0003-1117-7939"},"institutions":[{"id":"https://openalex.org/I4210120810","display_name":"National Institute of Technology","ror":"https://ror.org/02xqkcw08","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210120810"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Daichi Kitamura","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Institute of Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Institute of Technology, Japan","institution_ids":["https://openalex.org/I4210120810"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003814223","display_name":"Hiroshi Saruwatari","orcid":"https://orcid.org/0000-0003-0876-5617"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroshi Saruwatari","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5013050263"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":3.97340855,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.94080212,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"286","last_page":"290"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.9661874771118164},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5860699415206909},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5487710237503052},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5305260419845581},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46768122911453247},{"id":"https://openalex.org/keywords/group-delay-and-phase-delay","display_name":"Group delay and phase delay","score":0.45876070857048035},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.4462069571018219},{"id":"https://openalex.org/keywords/amplitude","display_name":"Amplitude","score":0.4334900379180908},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4330289661884308},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.2219209372997284},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.0909683108329773},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.08364260196685791}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.9661874771118164},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5860699415206909},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5487710237503052},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5305260419845581},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46768122911453247},{"id":"https://openalex.org/C123792056","wikidata":"https://www.wikidata.org/wiki/Q365988","display_name":"Group delay and phase delay","level":3,"score":0.45876070857048035},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.4462069571018219},{"id":"https://openalex.org/C180205008","wikidata":"https://www.wikidata.org/wiki/Q159190","display_name":"Amplitude","level":2,"score":0.4334900379180908},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4330289661884308},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2219209372997284},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0909683108329773},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.08364260196685791},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iwaenc.2018.8521313","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwaenc.2018.8521313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 16th International Workshop on Acoustic Signal Enhancement (IWAENC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1487641199","https://openalex.org/W1502723613","https://openalex.org/W1519782245","https://openalex.org/W1896470158","https://openalex.org/W2020108938","https://openalex.org/W2043734309","https://openalex.org/W2087316977","https://openalex.org/W2099471712","https://openalex.org/W2102003408","https://openalex.org/W2120847449","https://openalex.org/W2129082420","https://openalex.org/W2129142580","https://openalex.org/W2146502635","https://openalex.org/W2156387975","https://openalex.org/W2395700867","https://openalex.org/W2567070169","https://openalex.org/W2607404225","https://openalex.org/W2749881488","https://openalex.org/W2765486990","https://openalex.org/W2807065297","https://openalex.org/W2950292946","https://openalex.org/W2962916039","https://openalex.org/W2963609956","https://openalex.org/W2963970792","https://openalex.org/W2963971656","https://openalex.org/W3021520245","https://openalex.org/W4246202668","https://openalex.org/W4320013936","https://openalex.org/W6629354409","https://openalex.org/W6675380101","https://openalex.org/W6681435938","https://openalex.org/W6682889407","https://openalex.org/W6711832335","https://openalex.org/W6743594052"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W4375868962","https://openalex.org/W2011227383","https://openalex.org/W2088854863","https://openalex.org/W3179495260","https://openalex.org/W1976719989","https://openalex.org/W2942893872","https://openalex.org/W3127543252","https://openalex.org/W2897924318","https://openalex.org/W2138997758"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,69,82,87,109,123],"deep":[4],"neural":[5],"network":[6],"(DNN)-based":[7],"phase":[8,30,64,148],"reconstruction":[9,149],"from":[10,34],"amplitude":[11,20,36],"spectrograms.":[12],"In":[13],"audio":[14],"signal":[15],"and":[16,27,89,145],"speech":[17,153],"processing,":[18,26],"the":[19,28,35,39,42,46,60,73,90,94,99,102,117,133,156],"spectrogram":[21,31,37],"is":[22,32,68],"often":[23],"used":[24],"for":[25,63,112],"corresponding":[29],"reconstructed":[33],"on":[38,98],"basis":[40,100],"of":[41,81,93,101],"Griffin-Lim":[43,47,158],"method.":[44,159],"However,":[45],"method":[48],"causes":[49],"unnatural":[50],"artifacts":[51],"in":[52],"synthetic":[53],"speech.":[54],"Addressing":[55],"this":[56],"problem,":[57],"we":[58,107],"introduce":[59],"von-Mises-distribution":[61],"DNN":[62,67,95,113,135],"reconstruction.":[65],"The":[66,127],"generative":[70],"model":[71,79,91],"having":[72],"von":[74],"Mises":[75],"distribution":[76],"that":[77,131],"can":[78,136],"distributions":[80],"periodic":[83],"variable":[84],"such":[85],"as":[86],"phase,":[88],"parameters":[92],"are":[96],"estimated":[97],"maximum":[103],"likelihood":[104],"criterion.":[105],"Furthermore,":[106],"propose":[108],"group-delay":[110],"loss":[111],"training":[114],"to":[115,122],"make":[116],"predicted":[118],"group":[119,125,138],"delay":[120,139],"close":[121],"natural":[124],"delay.":[126],"experimental":[128],"results":[129],"demonstrate":[130],"1)":[132],"trained":[134],"predict":[137],"accurately":[140],"more":[141],"than":[142,155],"phases":[143],"themselves,":[144],"2)":[146],"our":[147],"methods":[150],"achieve":[151],"better":[152],"quality":[154],"conventional":[157]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":10}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
