{"id":"https://openalex.org/W2799258971","doi":"https://doi.org/10.1109/taslp.2018.2858559","title":"Adaptive Pooling Operators for Weakly Labeled Sound Event Detection","display_name":"Adaptive Pooling Operators for Weakly Labeled Sound Event Detection","publication_year":2018,"publication_date":"2018-08-13","ids":{"openalex":"https://openalex.org/W2799258971","doi":"https://doi.org/10.1109/taslp.2018.2858559","mag":"2799258971"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2018.2858559","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2858559","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010404092","display_name":"Brian McFee","orcid":"https://orcid.org/0000-0001-6261-9747"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Brian McFee","raw_affiliation_strings":["Music and Audio Research Laboratory and the Center for Data Science, New York University, New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"Music and Audio Research Laboratory and the Center for Data Science, New York University, New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037548450","display_name":"Justin Salamon","orcid":"https://orcid.org/0000-0001-6345-4593"},"institutions":[{"id":"https://openalex.org/I174216632","display_name":"City University of New York","ror":"https://ror.org/00453a208","country_code":"US","type":"education","lineage":["https://openalex.org/I174216632"]},{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Justin Salamon","raw_affiliation_strings":["Center for Urban Science and Progress, New York University, Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Center for Urban Science and Progress, New York University, Brooklyn, NY, USA","institution_ids":["https://openalex.org/I174216632","https://openalex.org/I57206974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031398497","display_name":"Juan Pablo Bello","orcid":"https://orcid.org/0000-0001-8561-5204"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juan Pablo Bello","raw_affiliation_strings":["Music and Audio Research Laboratory, New York University, New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"Music and Audio Research Laboratory, New York University, New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5010404092"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":17.5762,"has_fulltext":false,"cited_by_count":162,"citation_normalized_percentile":{"value":0.99499285,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"26","issue":"11","first_page":"2180","last_page":"2193"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9861000180244446,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.9273760318756104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7626823782920837},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.582539975643158},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5301709175109863},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.5226309299468994},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.500075101852417},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48747730255126953},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.4590436816215515},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36697980761528015}],"concepts":[{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.9273760318756104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7626823782920837},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.582539975643158},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5301709175109863},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.5226309299468994},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.500075101852417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48747730255126953},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.4590436816215515},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36697980761528015},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2018.2858559","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2858559","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.7699999809265137,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":103,"referenced_works":["https://openalex.org/W821549425","https://openalex.org/W1511170870","https://openalex.org/W1522301498","https://openalex.org/W1533561824","https://openalex.org/W1565746575","https://openalex.org/W1568645074","https://openalex.org/W1622490909","https://openalex.org/W1650531274","https://openalex.org/W1836465849","https://openalex.org/W1844944916","https://openalex.org/W1961429348","https://openalex.org/W1974758710","https://openalex.org/W2011972438","https://openalex.org/W2013556148","https://openalex.org/W2034215399","https://openalex.org/W2038484192","https://openalex.org/W2061351061","https://openalex.org/W2077159900","https://openalex.org/W2083488428","https://openalex.org/W2090200552","https://openalex.org/W2098166271","https://openalex.org/W2102381657","https://openalex.org/W2108745803","https://openalex.org/W2110119381","https://openalex.org/W2121044470","https://openalex.org/W2123843894","https://openalex.org/W2126109423","https://openalex.org/W2133564696","https://openalex.org/W2135342008","https://openalex.org/W2135533176","https://openalex.org/W2140013053","https://openalex.org/W2147917435","https://openalex.org/W2166010828","https://openalex.org/W2198082746","https://openalex.org/W2201092681","https://openalex.org/W2222844749","https://openalex.org/W2232894815","https://openalex.org/W2296724634","https://openalex.org/W2341412280","https://openalex.org/W2354870669","https://openalex.org/W2398243923","https://openalex.org/W2402144811","https://openalex.org/W2407542046","https://openalex.org/W2408239454","https://openalex.org/W2477915622","https://openalex.org/W2526050071","https://openalex.org/W2529483679","https://openalex.org/W2552032035","https://openalex.org/W2553581788","https://openalex.org/W2565911560","https://openalex.org/W2591013610","https://openalex.org/W2593116425","https://openalex.org/W2604465723","https://openalex.org/W2618269622","https://openalex.org/W2619697695","https://openalex.org/W2654517624","https://openalex.org/W2757154355","https://openalex.org/W2763971240","https://openalex.org/W2771361008","https://openalex.org/W2775505379","https://openalex.org/W2798193689","https://openalex.org/W2798350598","https://openalex.org/W2890012819","https://openalex.org/W2953384591","https://openalex.org/W2962910554","https://openalex.org/W2963099423","https://openalex.org/W2963723765","https://openalex.org/W2964121744","https://openalex.org/W2964136284","https://openalex.org/W2964308564","https://openalex.org/W3209800560","https://openalex.org/W3210064060","https://openalex.org/W4294620492","https://openalex.org/W4387533596","https://openalex.org/W6631190155","https://openalex.org/W6632323398","https://openalex.org/W6636517600","https://openalex.org/W6638667902","https://openalex.org/W6666040507","https://openalex.org/W6676245398","https://openalex.org/W6678230397","https://openalex.org/W6679434410","https://openalex.org/W6680102115","https://openalex.org/W6680873201","https://openalex.org/W6684369376","https://openalex.org/W6687511127","https://openalex.org/W6687630728","https://openalex.org/W6689149156","https://openalex.org/W6696126599","https://openalex.org/W6697040288","https://openalex.org/W6706051827","https://openalex.org/W6712594816","https://openalex.org/W6713134421","https://openalex.org/W6721490382","https://openalex.org/W6745117180","https://openalex.org/W6745214240","https://openalex.org/W6745928684","https://openalex.org/W6745952243","https://openalex.org/W6747331233","https://openalex.org/W6750169387","https://openalex.org/W6750533491","https://openalex.org/W6753803210","https://openalex.org/W6803424631"],"related_works":["https://openalex.org/W2517027266","https://openalex.org/W2424871898","https://openalex.org/W2291847203","https://openalex.org/W3004532561","https://openalex.org/W4287776258","https://openalex.org/W2756241593","https://openalex.org/W3027997911","https://openalex.org/W2767651786","https://openalex.org/W2944724518","https://openalex.org/W3021430260"],"abstract_inverted_index":{"Sound":[0],"event":[1],"detection":[2],"(SED)":[3],"methods":[4,189,242],"are":[5,55,89,243],"tasked":[6],"with":[7,205,216],"labeling":[8],"segments":[9],"of":[10,16,38,52,70,100,137,166,202],"audio":[11],"recordings":[12],"by":[13],"the":[14,34,47,67,96,164,167,174,187,200,240],"presence":[15,35,97],"active":[17],"sound":[18,40,101,168],"sources.":[19],"SED":[20,71,78,238],"is":[21,212],"typically":[22],"posed":[23],"as":[24,79,144,155],"a":[25,80,92,135],"supervised":[26],"machine":[27],"learning":[28,83],"problem,":[29,85],"requiring":[30],"strong":[31,50],"annotations":[32,51],"for":[33,60,194,229],"or":[36,98,158],"absence":[37,99],"each":[39,185],"source":[41],"at":[42],"every":[43],"time":[44],"instant":[45],"within":[46],"recording.":[48],"However,":[49],"this":[53,74,131,234],"type":[54],"both":[56],"labor-":[57],"and":[58,160,181,197,245],"cost-intensive":[59],"human":[61],"annotators":[62],"to":[63,143,163,225,250],"produce,":[64],"which":[65,117,147],"limits":[66],"practical":[68],"scalability":[69],"methods.":[72],"In":[73],"paper,":[75],"we":[76,133],"treat":[77],"multiple":[81],"instance":[82],"(MIL)":[84],"where":[86],"training":[87],"labels":[88,126],"static":[90,125,195],"over":[91],"short":[93],"excerpt,":[94],"indicating":[95],"sources":[102,169],"but":[103,220],"not":[104],"their":[105],"temporal":[106],"locality.":[107],"The":[108,209],"models,":[109],"however,":[110],"must":[111,118],"still":[112],"produce":[113],"temporally":[114],"dynamic":[115,207],"predictions,":[116],"be":[119,222,247],"aggregated":[120],"(pooled)":[121],"when":[122],"comparing":[123],"against":[124],"during":[127],"training.":[128],"To":[129],"facilitate":[130],"aggregation,":[132],"develop":[134],"family":[136],"adaptive":[138],"pooling":[139,152,176,192],"operators":[140,177,193],"-":[141,146],"referred":[142],"autopool":[145],"smoothly":[148],"interpolate":[149],"between":[150],"common":[151],"operators,":[153],"such":[154],"min-,":[156],"max-,":[157],"average-pooling,":[159],"automatically":[161],"adapt":[162],"characteristics":[165],"in":[170,184,214,253],"question.":[171],"We":[172],"evaluate":[173],"proposed":[175,188,210,241],"on":[178,237],"three":[179],"datasets,":[180],"demonstrate":[182],"that":[183],"case,":[186],"outperform":[190],"nonadaptive":[191],"prediction,":[196],"nearly":[198],"match":[199],"performance":[201],"models":[203],"trained":[204],"strong,":[206],"annotations.":[208],"method":[211],"evaluated":[213],"conjunction":[215],"convolutional":[217],"neural":[218],"networks,":[219],"can":[221],"readily":[223],"applied":[224,248],"any":[226,254],"differentiable":[227],"model":[228],"time-series":[230],"label":[231],"prediction.":[232],"While":[233],"paper":[235],"focuses":[236],"applications,":[239],"general,":[244],"could":[246],"widely":[249],"MIL":[251],"problems":[252],"domain.":[255]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":24},{"year":2021,"cited_by_count":41},{"year":2020,"cited_by_count":41},{"year":2019,"cited_by_count":22},{"year":2018,"cited_by_count":2}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
