{"id":"https://openalex.org/W4416799175","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249328","title":"Anomalous Sound Detection Using Time-Frequency Derivative of Instantaneous Phase Features","display_name":"Anomalous Sound Detection Using Time-Frequency Derivative of Instantaneous Phase Features","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416799175","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249328"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101962558","display_name":"Thanh D. Vo","orcid":"https://orcid.org/0000-0002-1797-6320"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tran-Quang-Tuan Vo","raw_affiliation_strings":["Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111119730","display_name":"Quoc\u2010Huy Nguyen","orcid":"https://orcid.org/0000-0003-4996-628X"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Quoc-Huy Nguyen","raw_affiliation_strings":["Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014199725","display_name":"Masashi Unoki","orcid":"https://orcid.org/0000-0002-6605-2052"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masashi Unoki","raw_affiliation_strings":["Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Japan Advanced Institute of Science and Technology,Nomi,Ishikawa,Japan,923-1292","institution_ids":["https://openalex.org/I177738480"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17645033,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"501","last_page":"506"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.6205999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.6205999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10220","display_name":"Machine Fault Diagnosis Techniques","score":0.08399999886751175,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.07569999992847443,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5753999948501587},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.5745999813079834},{"id":"https://openalex.org/keywords/amplitude","display_name":"Amplitude","score":0.5291000008583069},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.5289999842643738},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.5228000283241272},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5048999786376953},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4864000082015991},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.4514000117778778}],"concepts":[{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5753999948501587},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.5745999813079834},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5636000037193298},{"id":"https://openalex.org/C180205008","wikidata":"https://www.wikidata.org/wiki/Q159190","display_name":"Amplitude","level":2,"score":0.5291000008583069},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.5289999842643738},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.5228000283241272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.521399974822998},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5048999786376953},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4864000082015991},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.4514000117778778},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4327000081539154},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.40290001034736633},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.39570000767707825},{"id":"https://openalex.org/C58471807","wikidata":"https://www.wikidata.org/wiki/Q327120","display_name":"Receiver operating characteristic","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3400999903678894},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.33739998936653137},{"id":"https://openalex.org/C137270730","wikidata":"https://www.wikidata.org/wiki/Q120811","display_name":"Detection theory","level":3,"score":0.335099995136261},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32690000534057617},{"id":"https://openalex.org/C111771559","wikidata":"https://www.wikidata.org/wiki/Q66295","display_name":"Derivative (finance)","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.3059999942779541},{"id":"https://openalex.org/C2984030306","wikidata":"https://www.wikidata.org/wiki/Q4819857","display_name":"Sound analysis","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C148043351","wikidata":"https://www.wikidata.org/wiki/Q4456944","display_name":"Current (fluid)","level":2,"score":0.27889999747276306},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27810001373291016},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C110086884","wikidata":"https://www.wikidata.org/wiki/Q2085341","display_name":"Phase detector","level":3,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2060539877","https://openalex.org/W2982294822","https://openalex.org/W2997122788","https://openalex.org/W3015356122","https://openalex.org/W3130472073","https://openalex.org/W4224917958","https://openalex.org/W4225274992","https://openalex.org/W4290943464","https://openalex.org/W4293363567","https://openalex.org/W4383899664","https://openalex.org/W4392903829","https://openalex.org/W4406859079","https://openalex.org/W4410738511","https://openalex.org/W4410763185"],"related_works":[],"abstract_inverted_index":{"Anomalous":[0],"sound":[1,25],"detection":[2],"(ASD)":[3],"plays":[4],"a":[5],"crucial":[6],"role":[7],"in":[8,33,152,164],"predictive":[9],"maintenance":[10],"for":[11,110],"industrial":[12,34,169],"machines,":[13],"enabling":[14],"the":[15,22,28,37,53,57,63,91,94,118,122,125,134,141],"monitoring":[16],"of":[17,24,30,39,56,93,96],"their":[18],"health":[19],"status":[20],"through":[21],"analysis":[23],"signals.":[26],"With":[27],"diversity":[29],"anomalous":[31,166],"sounds":[32,167],"environments":[35],"and":[36,102],"scarcity":[38],"labeled":[40],"data,":[41],"unsupervised":[42,158],"learning":[43,47],"that":[44,145,160],"leverages":[45],"deep":[46],"techniques":[48],"demonstrates":[49],"robust":[50],"performance.":[51],"However,":[52],"entire":[54],"performance":[55],"ASD":[58,73],"detector":[59],"depends":[60],"significantly":[61],"on":[62,68,76,85,117,140],"front":[64],"end,":[65],"which":[66],"concentrates":[67],"feature":[69],"extraction.":[70],"While":[71],"most":[72],"systems":[74],"rely":[75],"amplitude":[77,162],"information,":[78],"there":[79],"has":[80],"been":[81],"relatively":[82],"little":[83],"focus":[84],"phase":[86,98],"information.":[87],"This":[88],"study":[89],"proposes":[90],"use":[92],"derivatives":[95],"instantaneous":[97],"along":[99],"time,":[100],"frequency,":[101],"time-frequency,":[103],"incorporating":[104],"an":[105,150],"Interpolation":[106],"Deep":[107],"Neural":[108],"Network":[109],"ASD.":[111],"The":[112,137],"experimental":[113,138],"procedures":[114],"are":[115],"conducted":[116],"MIMII":[119,142],"dataset,":[120],"with":[121],"area":[123],"under":[124],"receiver":[126],"operating":[127],"characteristic":[128],"curve":[129],"(ROC":[130],"AUC)":[131],"serving":[132],"as":[133],"evaluation":[135],"metric.":[136],"results":[139],"dataset":[143],"demonstrate":[144],"our":[146],"proposed":[147,157],"method":[148],"achieves":[149],"improvement":[151],"AUC":[153],"over":[154],"other":[155],"recently":[156],"methods":[159],"utilize":[161],"information":[163],"detecting":[165],"from":[168],"machines.":[170]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-28T00:00:00"}
