{"id":"https://openalex.org/W2803849611","doi":"https://doi.org/10.1109/icassp.2018.8461501","title":"On the Importance of Analytic Phase of Speech Signals in Spoken Language Recognition","display_name":"On the Importance of Analytic Phase of Speech Signals in Spoken Language Recognition","publication_year":2018,"publication_date":"2018-04-01","ids":{"openalex":"https://openalex.org/W2803849611","doi":"https://doi.org/10.1109/icassp.2018.8461501","mag":"2803849611"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2018.8461501","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2018.8461501","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016027101","display_name":"Karthika Vijayan","orcid":"https://orcid.org/0000-0001-7281-1329"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Karthika Vijayan","raw_affiliation_strings":["Dept. of Electrical and Computer Engineering, National University of Singapore","Dept. of Electrical and Computer Engineering, National University of Singapore#TAB#"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, National University of Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, National University of Singapore#TAB#","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["Dept. of Electrical and Computer Engineering, National University of Singapore","Dept. of Electrical and Computer Engineering, National University of Singapore#TAB#"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, National University of Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, National University of Singapore#TAB#","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100813843","display_name":"Hanwu Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hanwu Sun","raw_affiliation_strings":["Human Language Technology Dept., Institute for Infocomm Research, Singapore","[Human Language Technology Dept., A *STAR, Institute for Infocomm Research, Singapore]"],"affiliations":[{"raw_affiliation_string":"Human Language Technology Dept., Institute for Infocomm Research, Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"[Human Language Technology Dept., A *STAR, Institute for Infocomm Research, Singapore]","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004287909","display_name":"Kong Aik Lee","orcid":"https://orcid.org/0000-0001-9133-3000"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Kong Aik Lee","raw_affiliation_strings":["Human Language Technology Dept., Institute for Infocomm Research, Singapore","[Human Language Technology Dept., A *STAR, Institute for Infocomm Research, Singapore]"],"affiliations":[{"raw_affiliation_string":"Human Language Technology Dept., Institute for Infocomm Research, Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"[Human Language Technology Dept., A *STAR, Institute for Infocomm Research, Singapore]","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5016027101"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.8144,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.7915469,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"4","issue":null,"first_page":"5194","last_page":"5198"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.6552778482437134},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6353956460952759},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.607367753982544},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.5927303433418274},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.5072757601737976},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4928627014160156},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.48578789830207825},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4466429650783539},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.44325560331344604},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4228472113609314},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.2576238811016083},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11132362484931946},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09990623593330383}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.6552778482437134},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6353956460952759},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.607367753982544},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.5927303433418274},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.5072757601737976},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4928627014160156},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.48578789830207825},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4466429650783539},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.44325560331344604},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4228472113609314},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2576238811016083},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11132362484931946},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09990623593330383},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2018.8461501","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2018.8461501","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W151003953","https://openalex.org/W1522720415","https://openalex.org/W1523138083","https://openalex.org/W1971694955","https://openalex.org/W1992095472","https://openalex.org/W1993177724","https://openalex.org/W1993482042","https://openalex.org/W2001932915","https://openalex.org/W2014893602","https://openalex.org/W2015424351","https://openalex.org/W2026411533","https://openalex.org/W2026704977","https://openalex.org/W2042211079","https://openalex.org/W2078169166","https://openalex.org/W2099625016","https://openalex.org/W2100546383","https://openalex.org/W2104457544","https://openalex.org/W2106051978","https://openalex.org/W2109225367","https://openalex.org/W2109622017","https://openalex.org/W2118180989","https://openalex.org/W2131703294","https://openalex.org/W2160511961","https://openalex.org/W2172287020","https://openalex.org/W2185814970","https://openalex.org/W2288613265","https://openalex.org/W2340176088","https://openalex.org/W2408021097","https://openalex.org/W2509153213","https://openalex.org/W4302458905","https://openalex.org/W6631349102","https://openalex.org/W6650842961","https://openalex.org/W6674960879","https://openalex.org/W6675793180","https://openalex.org/W6683497447","https://openalex.org/W6845844910"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W4385672897","https://openalex.org/W2736574136","https://openalex.org/W2373675101","https://openalex.org/W2038216521","https://openalex.org/W106160982","https://openalex.org/W894828327","https://openalex.org/W2136559180"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"study":[4],"the":[5,58,68,99,132,139],"role":[6],"of":[7,11,23,85,102,114,122,141],"long-time":[8,36,83],"analytic":[9,37,79,144],"phase":[10,145],"speech":[12,49,86],"signals":[13],"in":[14,39,55,87,126,146],"spoken":[15],"language":[16],"recognition":[17],"(SLR)":[18],"and":[19,75,107,124,134],"employ":[20],"a":[21],"set":[22],"features":[24,47,52,104,118],"termed":[25],"as":[26],"instantaneous":[27],"frequency":[28],"cepstral":[29,62],"coefficients":[30,63],"(IFCC).":[31],"We":[32],"extract":[33],"IFCC":[34,76,103,115],"from":[35,48,72,78,143],"phase,":[38,80],"an":[40],"effort":[41],"to":[42,105],"capture":[43],"long":[44],"range":[45],"acoustic":[46],"signals.":[50],"These":[51],"are":[53,70,77],"used":[54],"combination":[56],"with":[57,93,116],"traditional":[59],"shifted":[60],"delta":[61],"(SDCC)":[64],"for":[65],"SLR.":[66,147],"As":[67],"SDCC":[69,106,133],"extracted":[71],"spectral":[73],"magnitude":[74],"they":[81],"characterize":[82],"information":[84,142],"different":[88],"ways.":[89],"The":[90,112],"experiments":[91],"conducted":[92],"NIST":[94],"LRE":[95],"2017":[96],"task":[97],"reveals":[98],"complementary":[100],"effects":[101],"deep":[108],"bottleneck":[109],"(DBN)":[110],"features.":[111],"fusion":[113],"SDCC/DBN":[117],"delivered":[119],"relative":[120],"improvements":[121],"23.23%":[123],"16.78%":[125],"average":[127],"equal":[128],"error":[129],"rate":[130],"over":[131],"DBN":[135],"features,":[136],"respectively,":[137],"indicating":[138],"benefits":[140]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
