{"id":"https://openalex.org/W4386765318","doi":"https://doi.org/10.1109/waspaa58266.2023.10248128","title":"Location as Supervision for Weakly Supervised Multi-Channel Source Separation of Machine Sounds","display_name":"Location as Supervision for Weakly Supervised Multi-Channel Source Separation of Machine Sounds","publication_year":2023,"publication_date":"2023-09-15","ids":{"openalex":"https://openalex.org/W4386765318","doi":"https://doi.org/10.1109/waspaa58266.2023.10248128"},"language":"en","primary_location":{"id":"doi:10.1109/waspaa58266.2023.10248128","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa58266.2023.10248128","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.aalto.fi/en/publications/fcf159e8-52b6-4529-bc3f-567f36fd870b","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030863038","display_name":"Ricardo Falcon-Perez","orcid":"https://orcid.org/0009-0006-5871-3363"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]},{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI","US"],"is_corresponding":false,"raw_author_name":"Ricardo Falcon-Perez","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Acoustics Lab, D.I.C.E., Aalto University, Espoo, Finland","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Acoustics Lab, D.I.C.E., Aalto University, Espoo, Finland","institution_ids":["https://openalex.org/I9927081"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086940921","display_name":"Gordon Wichern","orcid":"https://orcid.org/0000-0002-8597-6795"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gordon Wichern","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102812631","display_name":"Fran\u00e7ois G. Germain","orcid":"https://orcid.org/0000-0002-8973-5315"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fran\u00e7ois G. Germain","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064097430","display_name":"Jonathan Le Roux","orcid":"https://orcid.org/0000-0002-0158-2837"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Le Roux","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories (MERL), Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210159266"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1848,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.43450539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7742398381233215},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.742559015750885},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.7216368913650513},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.560480535030365},{"id":"https://openalex.org/keywords/microphone-array","display_name":"Microphone array","score":0.5340707898139954},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5338324904441833},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5279777646064758},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4785328805446625},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.47623661160469055},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4723426103591919},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4334483742713928},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4263386130332947},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41911688446998596},{"id":"https://openalex.org/keywords/schematic","display_name":"Schematic","score":0.4148351848125458},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.403509259223938},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10870888829231262},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.10306993126869202}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7742398381233215},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.742559015750885},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.7216368913650513},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.560480535030365},{"id":"https://openalex.org/C2778806681","wikidata":"https://www.wikidata.org/wiki/Q907293","display_name":"Microphone array","level":4,"score":0.5340707898139954},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5338324904441833},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5279777646064758},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4785328805446625},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.47623661160469055},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4723426103591919},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4334483742713928},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4263386130332947},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41911688446998596},{"id":"https://openalex.org/C192328126","wikidata":"https://www.wikidata.org/wiki/Q4514647","display_name":"Schematic","level":2,"score":0.4148351848125458},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.403509259223938},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10870888829231262},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.10306993126869202},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/waspaa58266.2023.10248128","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa58266.2023.10248128","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/124292","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/fcf159e8-52b6-4529-bc3f-567f36fd870b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401662","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"acceptedVersion"}],"best_oa_location":{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/124292","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/fcf159e8-52b6-4529-bc3f-567f36fd870b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401662","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"acceptedVersion"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1601124178","https://openalex.org/W2221409856","https://openalex.org/W2763188033","https://openalex.org/W2771164042","https://openalex.org/W2897802972","https://openalex.org/W2900893004","https://openalex.org/W2902738348","https://openalex.org/W2909607850","https://openalex.org/W2962970794","https://openalex.org/W2980402953","https://openalex.org/W2984935418","https://openalex.org/W2988200020","https://openalex.org/W2990666817","https://openalex.org/W3011424113","https://openalex.org/W3015201698","https://openalex.org/W3016244615","https://openalex.org/W3034883497","https://openalex.org/W3092796334","https://openalex.org/W3093839391","https://openalex.org/W3095263845","https://openalex.org/W3097034112","https://openalex.org/W3097906045","https://openalex.org/W3104704316","https://openalex.org/W3121952123","https://openalex.org/W3153985003","https://openalex.org/W3157899172","https://openalex.org/W3158652463","https://openalex.org/W3160751854","https://openalex.org/W3198425604","https://openalex.org/W3199957557","https://openalex.org/W3201698955","https://openalex.org/W3207860153","https://openalex.org/W4225288502","https://openalex.org/W4296068764","https://openalex.org/W4297841581","https://openalex.org/W4320204617","https://openalex.org/W4372347386","https://openalex.org/W6745962113","https://openalex.org/W6768852591","https://openalex.org/W6778247133","https://openalex.org/W6779961064","https://openalex.org/W6784139575","https://openalex.org/W6784499681","https://openalex.org/W6810824476","https://openalex.org/W6850002427"],"related_works":["https://openalex.org/W1509813908","https://openalex.org/W1879255185","https://openalex.org/W2031820693","https://openalex.org/W3024816962","https://openalex.org/W973023320","https://openalex.org/W2120442551","https://openalex.org/W2769861442","https://openalex.org/W1910172735","https://openalex.org/W1980506188","https://openalex.org/W1510462426"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,78],"are":[4,125],"interested":[5],"in":[6,17,29,162],"learning":[7,72],"a":[8,23,41,60,92,118,172],"model":[9,173,185],"to":[10,34,73,105,121,176,191],"separate":[11,74],"sources":[12,104,136],"that":[13,25,95],"cannot":[14,79],"be":[15],"recorded":[16],"isolation,":[18],"such":[19,58],"as":[20,59,68,87],"parts":[21],"of":[22,40,46,110,133,145],"machine":[24,33,153],"must":[26],"run":[27],"simultaneously":[28],"order":[30],"for":[31,71,112,180],"the":[32,38,47,65,75,81,97,102,107,134,143,156],"function.":[35],"We":[36,90,141],"assume":[37],"presence":[39],"microphone":[42],"array":[43],"and":[44,115,189],"knowledge":[45],"source":[48,66,83,178,197],"locations":[49,67],"(potentially":[50],"obtained":[51],"from":[52,101,155],"schematics":[53],"or":[54,202],"an":[55],"auxiliary":[56],"sensor":[57],"camera).":[61],"Our":[62],"method":[63],"uses":[64],"weak":[69],"labels":[70],"sources,":[76],"since":[77],"obtain":[80],"isolated":[82,177,196],"signals":[84,179,198],"typically":[85],"used":[86],"training":[88],"targets.":[89],"propose":[91],"loss":[93,120],"function":[94],"requires":[96],"directional":[98],"features":[99],"computed":[100],"separated":[103,135],"match":[106],"true":[108],"direction":[109],"arrival":[111],"each":[113],"source,":[114],"also":[116],"include":[117],"reconstruction":[119],"ensure":[122],"all":[123],"frequencies":[124],"taken":[126],"into":[127],"account":[128],"by":[129,138],"at":[130],"least":[131],"one":[132],"output":[137],"our":[139,146,182],"model.":[140],"benchmark":[142],"performance":[144],"algorithm":[147],"using":[148,152],"synthetic":[149],"mixtures":[150],"created":[151],"sounds":[154],"DCASE":[157],"2021":[158],"Task":[159],"2":[160],"dataset":[161],"challenging":[163],"reverberant":[164],"conditions.":[165],"While":[166],"reaching":[167],"lower":[168],"objective":[169],"scores":[170],"than":[171],"with":[174],"access":[175],"training,":[181],"proposed":[183],"weakly-supervised":[184],"obtains":[186],"promising":[187],"results":[188],"applies":[190],"industrial":[192],"scenarios":[193],"where":[194],"collecting":[195],"is":[199],"prohibitively":[200],"expensive":[201],"impossible.":[203]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
