{"id":"https://openalex.org/W2040940879","doi":"https://doi.org/10.1109/icassp.2014.6853982","title":"Multi-resolution linear prediction based features for audio onset detection with bidirectional LSTM neural networks","display_name":"Multi-resolution linear prediction based features for audio onset detection with bidirectional LSTM neural networks","publication_year":2014,"publication_date":"2014-05-01","ids":{"openalex":"https://openalex.org/W2040940879","doi":"https://doi.org/10.1109/icassp.2014.6853982","mag":"2040940879"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2014.6853982","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6853982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://opus.bibliothek.uni-augsburg.de/opus4/files/72576/72576.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009327522","display_name":"Erik Marchi","orcid":"https://orcid.org/0000-0002-5335-6356"},"institutions":[{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]},{"id":"https://openalex.org/I4210094487","display_name":"Intel (Germany)","ror":"https://ror.org/00m2x0g47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210094487"]},{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE","US"],"is_corresponding":true,"raw_author_name":"Erik Marchi","raw_affiliation_strings":["Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","Machine Intell. & Signal Process. Group, Tech. Univ. Munchen, Mu\u0308nchen, Germany"],"affiliations":[{"raw_affiliation_string":"Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","institution_ids":["https://openalex.org/I62916508","https://openalex.org/I4210121626"]},{"raw_affiliation_string":"Machine Intell. & Signal Process. Group, Tech. Univ. Munchen, Mu\u0308nchen, Germany","institution_ids":["https://openalex.org/I62916508","https://openalex.org/I4210094487"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013662216","display_name":"Giacomo Ferroni","orcid":null},"institutions":[{"id":"https://openalex.org/I122534668","display_name":"Marche Polytechnic University","ror":"https://ror.org/00x69rs40","country_code":"IT","type":"education","lineage":["https://openalex.org/I122534668"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giacomo Ferroni","raw_affiliation_strings":["A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy"],"affiliations":[{"raw_affiliation_string":"A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","institution_ids":["https://openalex.org/I122534668"]},{"raw_affiliation_string":"Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy","institution_ids":["https://openalex.org/I122534668"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023264395","display_name":"Florian Eyben","orcid":null},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]},{"id":"https://openalex.org/I4210094487","display_name":"Intel (Germany)","ror":"https://ror.org/00m2x0g47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210094487"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Florian Eyben","raw_affiliation_strings":["Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","Machine Intell. & Signal Process. Group, Tech. Univ. Munchen, Mu\u0308nchen, Germany"],"affiliations":[{"raw_affiliation_string":"Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","institution_ids":["https://openalex.org/I62916508","https://openalex.org/I4210121626"]},{"raw_affiliation_string":"Machine Intell. & Signal Process. Group, Tech. Univ. Munchen, Mu\u0308nchen, Germany","institution_ids":["https://openalex.org/I62916508","https://openalex.org/I4210094487"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061023296","display_name":"Leonardo Gabrielli","orcid":"https://orcid.org/0000-0002-3812-0900"},"institutions":[{"id":"https://openalex.org/I122534668","display_name":"Marche Polytechnic University","ror":"https://ror.org/00x69rs40","country_code":"IT","type":"education","lineage":["https://openalex.org/I122534668"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Leonardo Gabrielli","raw_affiliation_strings":["A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy"],"affiliations":[{"raw_affiliation_string":"A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","institution_ids":["https://openalex.org/I122534668"]},{"raw_affiliation_string":"Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy","institution_ids":["https://openalex.org/I122534668"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034253968","display_name":"Stefano Squartini","orcid":"https://orcid.org/0000-0001-9374-0128"},"institutions":[{"id":"https://openalex.org/I122534668","display_name":"Marche Polytechnic University","ror":"https://ror.org/00x69rs40","country_code":"IT","type":"education","lineage":["https://openalex.org/I122534668"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Stefano Squartini","raw_affiliation_strings":["A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy"],"affiliations":[{"raw_affiliation_string":"A3LAB, Universit\u00e0 Politecnica delle Marche, ITALY","institution_ids":["https://openalex.org/I122534668"]},{"raw_affiliation_string":"Dept. of Inf. Eng., Univ. Politec. delle Marche, Ancona, Italy","institution_ids":["https://openalex.org/I122534668"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043060302","display_name":"Bj\u00f6rn W. Schuller","orcid":"https://orcid.org/0000-0002-6478-8699"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]},{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["DE","GB","US"],"is_corresponding":false,"raw_author_name":"Bjorn Schuller","raw_affiliation_strings":["Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","Dept. of Comput., Imperial Coll. London, London, UK"],"affiliations":[{"raw_affiliation_string":"Machine Intelligence & Signal Processing Group, Technische Universit\u00e4t M\u00fcnchen, GERMANY","institution_ids":["https://openalex.org/I62916508","https://openalex.org/I4210121626"]},{"raw_affiliation_string":"Dept. of Comput., Imperial Coll. London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5009327522"],"corresponding_institution_ids":["https://openalex.org/I4210094487","https://openalex.org/I4210121626","https://openalex.org/I62916508"],"apc_list":null,"apc_paid":null,"fwci":7.2783,"has_fulltext":false,"cited_by_count":91,"citation_normalized_percentile":{"value":0.97771991,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2164","last_page":"2168"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7902672290802002},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5340852737426758},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5333298444747925},{"id":"https://openalex.org/keywords/wavelet","display_name":"Wavelet","score":0.49609479308128357},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4953557252883911},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.464780330657959},{"id":"https://openalex.org/keywords/linear-prediction","display_name":"Linear prediction","score":0.4355812072753906},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4237768054008484},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3208395838737488}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7902672290802002},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5340852737426758},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5333298444747925},{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.49609479308128357},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4953557252883911},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.464780330657959},{"id":"https://openalex.org/C131109320","wikidata":"https://www.wikidata.org/wiki/Q581012","display_name":"Linear prediction","level":2,"score":0.4355812072753906},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4237768054008484},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3208395838737488},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/icassp.2014.6853982","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6853982","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:uni-augsburg.opus-bayern.de:72576","is_oa":true,"landing_page_url":"https://nbn-resolving.org/urn:nbn:de:bvb:384-opus4-725762","pdf_url":"https://opus.bibliothek.uni-augsburg.de/opus4/files/72576/72576.pdf","source":{"id":"https://openalex.org/S4306400930","display_name":"OPUS (Augsburg University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I119916105","host_organization_name":"Augsburg University","host_organization_lineage":["https://openalex.org/I119916105"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"bookpart"},{"id":"pmh:oai:iris.univpm.it:11566/153904","is_oa":false,"landing_page_url":"http://hdl.handle.net/11566/153904","pdf_url":null,"source":{"id":"https://openalex.org/S4306402571","display_name":"Universit\u00e0 Politecnica delle Marche (Universit\u00e0 Politecnica delle Marche)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122534668","host_organization_name":"Marche Polytechnic University","host_organization_lineage":["https://openalex.org/I122534668"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:uni-augsburg.opus-bayern.de:72576","is_oa":true,"landing_page_url":"https://nbn-resolving.org/urn:nbn:de:bvb:384-opus4-725762","pdf_url":"https://opus.bibliothek.uni-augsburg.de/opus4/files/72576/72576.pdf","source":{"id":"https://openalex.org/S4306400930","display_name":"OPUS (Augsburg University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I119916105","host_organization_name":"Augsburg University","host_organization_lineage":["https://openalex.org/I119916105"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"bookpart"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2040940879.pdf","grobid_xml":"https://content.openalex.org/works/W2040940879.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1492221128","https://openalex.org/W1598214593","https://openalex.org/W1990190154","https://openalex.org/W2057587042","https://openalex.org/W2064675550","https://openalex.org/W2084883122","https://openalex.org/W2090438737","https://openalex.org/W2098580349","https://openalex.org/W2103727353","https://openalex.org/W2105143211","https://openalex.org/W2114537739","https://openalex.org/W2120132744","https://openalex.org/W2127947624","https://openalex.org/W2131963441","https://openalex.org/W2133240958","https://openalex.org/W2139238328","https://openalex.org/W2140304104","https://openalex.org/W2142967796","https://openalex.org/W2148770797","https://openalex.org/W2152429995","https://openalex.org/W2159433418","https://openalex.org/W2293202270","https://openalex.org/W2397818963","https://openalex.org/W2402539476","https://openalex.org/W2598144628","https://openalex.org/W2745066247","https://openalex.org/W3113172960","https://openalex.org/W6635681657","https://openalex.org/W6674927801","https://openalex.org/W6697171384","https://openalex.org/W6713054120","https://openalex.org/W6742531275"],"related_works":["https://openalex.org/W2382174632","https://openalex.org/W2129959498","https://openalex.org/W2784060934","https://openalex.org/W2902714807","https://openalex.org/W2537489131","https://openalex.org/W2129377384","https://openalex.org/W2362031592","https://openalex.org/W2356580463","https://openalex.org/W3133960409","https://openalex.org/W86066796"],"abstract_inverted_index":{"A":[0],"plethora":[1],"of":[2,34,64,111,150,160],"different":[3,32,68],"onset":[4,65,112,118],"detection":[5,66],"methods":[6,125,147],"have":[7,17],"been":[8,18],"proposed":[9],"in":[10,25,67,148],"the":[11],"recent":[12],"years.":[13],"However,":[14],"few":[15],"attempts":[16],"made":[19],"with":[20,37,82,107,123],"respect":[21],"to":[22,27],"widely-applicable":[23],"approaches":[24],"order":[26],"achieve":[28],"superior":[29],"performances":[30],"over":[31],"types":[33],"music":[35,156],"and":[36,54,62,76,86,117,133,138],"considerable":[38],"temporal":[39],"precision.":[40],"In":[41,71],"this":[42],"paper,":[43],"we":[44,139],"present":[45],"a":[46,90,108,127],"multi-resolution":[47],"approach":[48,143],"based":[49],"on":[50,126],"discrete":[51],"wavelet":[52,74],"transform":[53],"linear":[55],"prediction":[56,78],"filtering":[57],"that":[58,129,141],"improves":[59],"time":[60],"resolution":[61],"performance":[63],"musical":[69],"scenarios.":[70],"our":[72,142],"approach,":[73],"coefficients":[75],"forward":[77],"errors":[79],"are":[80],"combined":[81],"auditory":[83],"spectral":[84],"features":[85],"then":[87],"processed":[88],"by":[89],"bidirectional":[91],"Long":[92],"Short-Term":[93],"Memory":[94],"recurrent":[95],"neural":[96],"network,":[97],"which":[98],"acts":[99],"as":[100],"reduction":[101],"function.":[102],"The":[103],"network":[104],"is":[105,162],"trained":[106],"large":[109],"database":[110],"data":[113],"covering":[114],"various":[115],"genres":[116],"types.":[119],"We":[120],"compare":[121],"results":[122],"state-of-the-art":[124],"dataset":[128],"includes":[130],"Bello,":[131],"Glover":[132],"ISMIR":[134],"2004":[135],"Ballroom":[136],"sets,":[137],"conclude":[140],"significantly":[144],"outperforms":[145],"existing":[146],"terms":[149],"F-Measure.":[151],"For":[152],"pitched":[153],"non":[154],"percussive":[155],"an":[157],"absolute":[158],"improvement":[159],"7.5%":[161],"reported.":[163]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":18},{"year":2018,"cited_by_count":14},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
