{"id":"https://openalex.org/W4414581923","doi":"https://doi.org/10.48550/arxiv.2505.18980","title":"Improving Anomalous Sound Detection through Pseudo-anomalous Set Selection and Pseudo-label Utilization under Unlabeled Conditions","display_name":"Improving Anomalous Sound Detection through Pseudo-anomalous Set Selection and Pseudo-label Utilization under Unlabeled Conditions","publication_year":2025,"publication_date":"2025-05-25","ids":{"openalex":"https://openalex.org/W4414581923","doi":"https://doi.org/10.48550/arxiv.2505.18980"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2505.18980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.18980","pdf_url":"https://arxiv.org/pdf/2505.18980","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2505.18980","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074471104","display_name":"Ibuki Kuroyanagi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kuroyanagi, Ibuki","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048172594","display_name":"Takuya Fujimura","orcid":"https://orcid.org/0000-0003-1726-8372"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fujimura, Takuya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042118446","display_name":"Kazuya Takeda","orcid":"https://orcid.org/0000-0002-0330-1787"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Takeda, Kazuya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078330211","display_name":"Tomoki Toda","orcid":"https://orcid.org/0000-0001-8146-1279"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Toda, Tomoki","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5074471104"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11220","display_name":"Water Systems and Optimization","score":0.9348000288009644,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9298999905586243,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6410999894142151},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.608299970626831},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49540001153945923},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.4902999997138977},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4668999910354614},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4668000042438507},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.45339998602867126},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.43709999322891235}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7070000171661377},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6410999894142151},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.608299970626831},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6014000177383423},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49540001153945923},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.4902999997138977},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48159998655319214},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4668999910354614},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4668000042438507},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.45339998602867126},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.43709999322891235},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.41260001063346863},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4074999988079071},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.39259999990463257},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.36820000410079956},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.33309999108314514},{"id":"https://openalex.org/C2984030306","wikidata":"https://www.wikidata.org/wiki/Q4819857","display_name":"Sound analysis","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2567000091075897},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2505.18980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.18980","pdf_url":"https://arxiv.org/pdf/2505.18980","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2505.18980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2505.18980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2505.18980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.18980","pdf_url":"https://arxiv.org/pdf/2505.18980","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"performance":[3],"degradation":[4],"in":[5,115,156],"anomalous":[6],"sound":[7],"detection":[8,83,104],"(ASD)":[9],"when":[10],"neither":[11],"sufficiently":[12],"similar":[13],"machine":[14,160],"data":[15,56,138,161],"nor":[16],"operational":[17,80],"state":[18],"labels":[19],"are":[20],"available.":[21],"We":[22],"present":[23],"an":[24,47,121],"integrated":[25],"pipeline":[26],"that":[27],"combines":[28],"three":[29],"complementary":[30],"components":[31],"derived":[32],"from":[33,139],"prior":[34],"work":[35],"and":[36,82,99,151,162],"extends":[37],"them":[38],"to":[39,52,70,73,92,130],"the":[40,58,62,95,108,140,149],"unlabeled":[41,74,116],"ASD":[42,165],"setting.":[43],"First,":[44],"we":[45,66,88],"adapt":[46],"anomaly":[48],"score":[49],"based":[50],"selector":[51],"curate":[53],"external":[54,137],"audio":[55],"resembling":[57],"normal":[59],"sounds":[60,81],"of":[61,79,84,125,153],"target":[63],"machine.":[64],"Second,":[65],"utilize":[67],"triplet":[68],"learning":[69],"assign":[71],"pseudo-labels":[72],"data,":[75],"enabling":[76],"finer":[77],"classification":[78],"subtle":[85],"anomalies.":[86],"Third,":[87],"employ":[89],"iterative":[90],"training":[91],"refine":[93],"both":[94],"pseudo-anomalous":[96,141],"set":[97,142],"selection":[98],"pseudo-label":[100],"assignment,":[101],"progressively":[102],"improving":[103],"accuracy.":[105],"Experiments":[106],"on":[107],"DCASE2022-2024":[109],"Task":[110],"2":[111],"datasets":[112],"demonstrate":[113],"that,":[114],"settings,":[117,135],"our":[118,154],"approach":[119],"achieves":[120],"average":[122],"AUC":[123],"increase":[124],"over":[126],"6.6":[127],"points":[128],"compared":[129],"conventional":[131],"methods.":[132],"In":[133],"labeled":[134],"incorporating":[136],"further":[143],"boosts":[144],"performance.":[145],"These":[146],"results":[147],"highlight":[148],"practicality":[150],"robustness":[152],"methods":[155],"scenarios":[157],"with":[158,171],"scarce":[159],"labels,":[163],"facilitating":[164],"deployment":[166],"across":[167],"diverse":[168],"industrial":[169],"settings":[170],"minimal":[172],"annotation":[173],"effort.":[174]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
