{"id":"https://openalex.org/W4390636217","doi":"https://doi.org/10.1186/s13636-023-00324-4","title":"Significance of relative phase features for shouted and normal speech classification","display_name":"Significance of relative phase features for shouted and normal speech classification","publication_year":2024,"publication_date":"2024-01-06","ids":{"openalex":"https://openalex.org/W4390636217","doi":"https://doi.org/10.1186/s13636-023-00324-4"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-023-00324-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-023-00324-4","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-023-00324-4","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-023-00324-4","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032892004","display_name":"Khomdet Phapatanaburi","orcid":"https://orcid.org/0000-0002-6487-2073"},"institutions":[{"id":"https://openalex.org/I1285782058","display_name":"Rajamangala University of Technology Isan","ror":"https://ror.org/04a2rz655","country_code":"TH","type":"education","lineage":["https://openalex.org/I1285782058"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Khomdet Phapatanaburi","raw_affiliation_strings":["Department of Telecommunication Engineering, Faculty of Engineering and Technology, Rajamangala University of Technology Isan, Nakhonrachasrima, 30000, Thailand","Department of Telecommunication Engineering, Faculty of Engineering and Technology, Rajamangala University of Technology Isan, Nakhonrachasrima, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Telecommunication Engineering, Faculty of Engineering and Technology, Rajamangala University of Technology Isan, Nakhonrachasrima, 30000, Thailand","institution_ids":["https://openalex.org/I1285782058"]},{"raw_affiliation_string":"Department of Telecommunication Engineering, Faculty of Engineering and Technology, Rajamangala University of Technology Isan, Nakhonrachasrima, Thailand","institution_ids":["https://openalex.org/I1285782058"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050763764","display_name":"Longbiao Wang","orcid":"https://orcid.org/0000-0002-4005-5036"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Longbiao Wang","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, 300350, China","Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0002-4005-5036","affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, 300350, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100457438","display_name":"Meng Liu","orcid":"https://orcid.org/0000-0002-1582-5764"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Liu","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, 300350, China","Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, 300350, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018428974","display_name":"Seiichi Nakagawa","orcid":"https://orcid.org/0000-0002-6533-5536"},"institutions":[{"id":"https://openalex.org/I184937672","display_name":"Chubu University","ror":"https://ror.org/02sps0775","country_code":"JP","type":"education","lineage":["https://openalex.org/I184937672"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Seiichi Nakagawa","raw_affiliation_strings":["Faculty of Engineering, Chubu University, Kasugai, Aichi, 487-8501, Japan","Faculty of Engineering, Chubu University, Kasugai, Aichi, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Chubu University, Kasugai, Aichi, 487-8501, Japan","institution_ids":["https://openalex.org/I184937672"]},{"raw_affiliation_string":"Faculty of Engineering, Chubu University, Kasugai, Aichi, Japan","institution_ids":["https://openalex.org/I184937672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019645995","display_name":"Talit Jumphoo","orcid":"https://orcid.org/0000-0003-4800-648X"},"institutions":[{"id":"https://openalex.org/I82475049","display_name":"Suranaree University of Technology","ror":"https://ror.org/05sgb8g78","country_code":"TH","type":"education","lineage":["https://openalex.org/I82475049"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Talit Jumphoo","raw_affiliation_strings":["School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, 30000, Thailand","School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, 30000, Thailand","institution_ids":["https://openalex.org/I82475049"]},{"raw_affiliation_string":"School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, Thailand","institution_ids":["https://openalex.org/I82475049"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044429602","display_name":"Peerapong Uthansakul","orcid":"https://orcid.org/0000-0002-7108-9263"},"institutions":[{"id":"https://openalex.org/I82475049","display_name":"Suranaree University of Technology","ror":"https://ror.org/05sgb8g78","country_code":"TH","type":"education","lineage":["https://openalex.org/I82475049"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Peerapong Uthansakul","raw_affiliation_strings":["School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, 30000, Thailand","School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, 30000, Thailand","institution_ids":["https://openalex.org/I82475049"]},{"raw_affiliation_string":"School of Telecommunication Engineering, Suranaree University of Technology, Nakhon Ratchasima, Thailand","institution_ids":["https://openalex.org/I82475049"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5050763764"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":2.2028,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.88546062,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"2024","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.8067083954811096},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6704519391059875},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5686160326004028},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5565450191497803},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5502996444702148},{"id":"https://openalex.org/keywords/linear-prediction","display_name":"Linear prediction","score":0.5247007608413696},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.47096922993659973},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.46589505672454834},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42842981219291687}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.8067083954811096},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6704519391059875},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5686160326004028},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5565450191497803},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5502996444702148},{"id":"https://openalex.org/C131109320","wikidata":"https://www.wikidata.org/wiki/Q581012","display_name":"Linear prediction","level":2,"score":0.5247007608413696},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.47096922993659973},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.46589505672454834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42842981219291687},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s13636-023-00324-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-023-00324-4","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-023-00324-4","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:00f296c9c67e48219caa4a7c2ced5455","is_oa":true,"landing_page_url":"https://doaj.org/article/00f296c9c67e48219caa4a7c2ced5455","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing, Vol 2024, Iss 1, Pp 1-14 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s13636-023-00324-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-023-00324-4","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-023-00324-4","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.4099999964237213,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G7732325329","display_name":null,"funder_award_id":"62176182","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322574","display_name":"Suranaree University of Technology","ror":"https://ror.org/05sgb8g78"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390636217.pdf"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W1555937754","https://openalex.org/W1967429593","https://openalex.org/W1992475611","https://openalex.org/W2002311796","https://openalex.org/W2004916802","https://openalex.org/W2022895291","https://openalex.org/W2036015554","https://openalex.org/W2080278484","https://openalex.org/W2084339293","https://openalex.org/W2095176743","https://openalex.org/W2109000787","https://openalex.org/W2112164460","https://openalex.org/W2125514156","https://openalex.org/W2129244720","https://openalex.org/W2145212718","https://openalex.org/W2162614059","https://openalex.org/W2168609109","https://openalex.org/W2296529392","https://openalex.org/W2345844407","https://openalex.org/W2406845569","https://openalex.org/W2513927927","https://openalex.org/W2564171085","https://openalex.org/W2586709666","https://openalex.org/W2606406919","https://openalex.org/W2606977969","https://openalex.org/W2613770330","https://openalex.org/W2747872086","https://openalex.org/W2753897885","https://openalex.org/W2789949544","https://openalex.org/W2805352943","https://openalex.org/W2808513547","https://openalex.org/W2921982339","https://openalex.org/W2944025308","https://openalex.org/W2947119368","https://openalex.org/W2952384848","https://openalex.org/W2989825986","https://openalex.org/W2995655945","https://openalex.org/W2997139369","https://openalex.org/W3007267003"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W2787035864","https://openalex.org/W2373675101","https://openalex.org/W106160982","https://openalex.org/W2359140082","https://openalex.org/W1556565948","https://openalex.org/W2074132948","https://openalex.org/W2160511961"],"abstract_inverted_index":{"Abstract":[0],"Shouted":[1],"and":[2,23,74,85,118,131,146,166,212,233],"normal":[3,86,153,254],"speech":[4,87,155,252],"classification":[5,141],"plays":[6],"an":[7,216],"important":[8],"role":[9],"in":[10,249],"many":[11],"speech-related":[12],"applications.":[13],"The":[14,50,103,143,158],"existing":[15],"works":[16],"are":[17,28,56,81,148],"often":[18],"based":[19],"on":[20],"magnitude-based":[21,132],"features":[22,41,120,133,168,214,236,248],"ignore":[24],"phase-based":[25,40,61],"features,":[26,62,80,205],"which":[27],"directly":[29],"related":[30],"to":[31,112,121,137,202],"magnitude":[32],"information.":[33],"In":[34],"this":[35,54],"paper,":[36],"the":[37,45,97,107,114,140,151,163,173,182,193,206,210,227,231,234,244],"importance":[38,245],"of":[39,47,53,106,129,175,192,209,230,246],"is":[42,111,134],"explored":[43,82],"for":[44,83,172],"detection":[46,174,218],"shouted":[48,84,123,152,176,251],"speech.":[49,124,177,255],"novel":[51],"contributions":[52],"work":[55],"as":[57],"follows.":[58],"(1)":[59],"Three":[60],"namely,":[63],"relative":[64],"phase":[65],"(RP),":[66],"linear":[67,75],"prediction":[68,76],"analysis":[69,221],"estimated":[70],"speech-based":[71],"RP":[72,78,94,100,117,247],"(LPAES-RP)":[73],"residual-based":[77],"(LPR-RP)":[79],"classification.":[88,240],"(2)":[89],"We":[90,178],"propose":[91],"a":[92],"new":[93],"feature,":[95],"called":[96],"glottal":[98],"source-based":[99],"(GRP)":[101],"feature.":[102,199],"main":[104],"idea":[105],"proposed":[108,144,183],"GRP":[109,184],"feature":[110,145,185],"exploit":[113],"difference":[115],"between":[116],"LPAES-RP":[119],"detect":[122],"(3)":[125],"A":[126],"score":[127,207,228],"combination":[128,147,208,229],"phase-":[130],"also":[135,179],"employed":[136],"further":[138],"improve":[139],"performance.":[142,219],"evaluated":[149],"using":[150,203],"electroglottograph":[154],"(SNE-Speech)":[156],"corpus.":[157],"experimental":[159],"findings":[160],"show":[161,243],"that":[162,181,226],"RP,":[164],"LPAES-RP,":[165],"LPR-RP":[167],"provide":[169,187],"promising":[170],"results":[171,189],"find":[180],"can":[186],"better":[188],"than":[190],"those":[191],"standard":[194],"mel-frequency":[195],"cepstral":[196],"coefficient":[197],"(MFCC)":[198],"Moreover,":[200],"compared":[201],"individual":[204],"MFCC":[211,232],"RP/LPAES-RP/LPR-RP/GRP":[213],"yields":[215],"improved":[217],"Performance":[220],"under":[222],"noisy":[223],"environments":[224],"shows":[225],"RP/LPAES-RP/LPR-RP":[235],"gives":[237],"more":[238],"robust":[239],"These":[241],"outcomes":[242],"distinguishing":[250],"from":[253]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
