{"id":"https://openalex.org/W2962924597","doi":"https://doi.org/10.23919/eusipco.2018.8553198","title":"Capsule Routing for Sound Event Detection","display_name":"Capsule Routing for Sound Event Detection","publication_year":2018,"publication_date":"2018-09-01","ids":{"openalex":"https://openalex.org/W2962924597","doi":"https://doi.org/10.23919/eusipco.2018.8553198","mag":"2962924597"},"language":"en","primary_location":{"id":"doi:10.23919/eusipco.2018.8553198","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco.2018.8553198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 26th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056441203","display_name":"Turab Iqbal","orcid":"https://orcid.org/0000-0003-3393-2544"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["GB","US"],"is_corresponding":true,"raw_author_name":"Turab Iqbal","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey","institution_ids":["https://openalex.org/I28290843","https://openalex.org/I4210121626"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101467338","display_name":"Yong Xu","orcid":"https://orcid.org/0000-0003-4944-6890"},"institutions":[{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]},{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Yong Xu","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey","institution_ids":["https://openalex.org/I28290843","https://openalex.org/I4210121626"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072482416","display_name":"Qiuqiang Kong","orcid":"https://orcid.org/0000-0003-2864-0475"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Qiuqiang Kong","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey","institution_ids":["https://openalex.org/I28290843","https://openalex.org/I4210121626"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100676721","display_name":"Wenwu Wang","orcid":"https://orcid.org/0000-0002-8393-5703"},"institutions":[{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]},{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Wenwu Wang","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey","institution_ids":["https://openalex.org/I28290843","https://openalex.org/I4210121626"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5056441203"],"corresponding_institution_ids":["https://openalex.org/I28290843","https://openalex.org/I4210121626"],"apc_list":null,"apc_paid":null,"fwci":4.2937,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.95418683,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2255","last_page":"2259"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8182542324066162},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7360429763793945},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.6109474897384644},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4631494879722595},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40053433179855347},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3968152701854706},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3709365725517273},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3438708782196045},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.2516784071922302}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8182542324066162},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7360429763793945},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.6109474897384644},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4631494879722595},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40053433179855347},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3968152701854706},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3709365725517273},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3438708782196045},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2516784071922302},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/eusipco.2018.8553198","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco.2018.8553198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 26th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life in Land","score":0.5400000214576721,"id":"https://metadata.un.org/sdg/15"}],"awards":[{"id":"https://openalex.org/G4971557284","display_name":null,"funder_award_id":"1976218","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2966661","https://openalex.org/W1514535095","https://openalex.org/W1522301498","https://openalex.org/W1665214252","https://openalex.org/W1836465849","https://openalex.org/W1904365287","https://openalex.org/W2008415856","https://openalex.org/W2086384421","https://openalex.org/W2095705004","https://openalex.org/W2103235956","https://openalex.org/W2108598243","https://openalex.org/W2112796928","https://openalex.org/W2131774270","https://openalex.org/W2133564696","https://openalex.org/W2408239454","https://openalex.org/W2567070169","https://openalex.org/W2591013610","https://openalex.org/W2604490051","https://openalex.org/W2735072998","https://openalex.org/W2757154355","https://openalex.org/W2758870122","https://openalex.org/W2759176740","https://openalex.org/W2760098415","https://openalex.org/W2775505379","https://openalex.org/W2775794021","https://openalex.org/W2785994986","https://openalex.org/W2797472209","https://openalex.org/W2949117887","https://openalex.org/W2963703618","https://openalex.org/W2963723765","https://openalex.org/W2963970792","https://openalex.org/W2964121744","https://openalex.org/W2964308564","https://openalex.org/W6630875275","https://openalex.org/W6631190155","https://openalex.org/W6637242042","https://openalex.org/W6638667902","https://openalex.org/W6674330103","https://openalex.org/W6679434410","https://openalex.org/W6731370813","https://openalex.org/W6743446608","https://openalex.org/W6747331233","https://openalex.org/W6748053814"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W1574414179","https://openalex.org/W4297676672","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4281702477","https://openalex.org/W2490526372","https://openalex.org/W4376166922","https://openalex.org/W4378510483","https://openalex.org/W2885665929"],"abstract_inverted_index":{"The":[0],"detection":[1],"of":[2,57,63,68,73,102,134,149],"acoustic":[3],"scenes":[4],"is":[5,54,75,89,129,144,154],"a":[6,18,41,55,61,84,94,114],"challenging":[7],"problem":[8,39],"in":[9,86,96,100],"which":[10],"environmental":[11],"sound":[12],"events":[13,26],"must":[14],"be":[15],"detected":[16],"from":[17],"given":[19],"audio":[20],"signal.":[21],"This":[22],"includes":[23],"classifying":[24],"the":[25,47,71,97,103,135],"as":[27,29],"well":[28],"estimating":[30],"their":[31],"onset":[32],"and":[33,70],"offset":[34],"times.":[35],"We":[36],"approach":[37],"this":[38],"with":[40],"neural":[42],"network":[43,115],"architecture":[44],"that":[45,116,141],"uses":[46],"recently-proposed":[48],"capsule":[49,53,85,95,108],"routing":[50,74],"mechanism.":[51],"A":[52],"group":[56],"activation":[58],"units":[59],"representing":[60],"set":[62],"properties":[64],"for":[65],"an":[66,147],"entity":[67,104],"interest,":[69],"purpose":[72],"to":[76,91,93,112,158],"identify":[77],"part-whole":[78],"relationships":[79],"between":[80],"capsules.":[81],"That":[82],"is,":[83],"one":[87],"layer":[88,98],"assumed":[90],"belong":[92],"above":[99],"terms":[101],"being":[105],"represented.":[106],"Using":[107],"routing,":[109],"we":[110],"wish":[111],"train":[113],"can":[117],"learn":[118],"global":[119],"coherence":[120],"implicitly,":[121],"thereby":[122],"improving":[123],"generalization":[124],"performance.":[125],"Our":[126],"proposed":[127],"method":[128],"evaluated":[130],"on":[131],"Task":[132],"4":[133],"DCASE":[136],"2017":[137],"challenge.":[138],"Results":[139],"show":[140],"classification":[142],"performance":[143],"state-of-the-art,":[145],"achieving":[146],"F-score":[148],"58.6%.":[150],"In":[151],"addition,":[152],"overfitting":[153],"reduced":[155],"considerably":[156],"compared":[157],"other":[159],"architectures.":[160]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
