{"id":"https://openalex.org/W2751958095","doi":"https://doi.org/10.23919/eusipco.2018.8553106","title":"A Comparison of Audio Signal Preprocessing Methods for Deep Neural Networks on Music Tagging","display_name":"A Comparison of Audio Signal Preprocessing Methods for Deep Neural Networks on Music Tagging","publication_year":2018,"publication_date":"2018-09-01","ids":{"openalex":"https://openalex.org/W2751958095","doi":"https://doi.org/10.23919/eusipco.2018.8553106","mag":"2751958095"},"language":"en","primary_location":{"id":"doi:10.23919/eusipco.2018.8553106","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco.2018.8553106","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 26th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1709.01922","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011038627","display_name":"Keunwoo Choi","orcid":"https://orcid.org/0000-0002-5305-5342"},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Keunwoo Choi","raw_affiliation_strings":["Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK"],"affiliations":[{"raw_affiliation_string":"Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK","institution_ids":["https://openalex.org/I166337079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032485940","display_name":"Gy\u00f6rgy Fazekas","orcid":null},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Gyorgy Fazekas","raw_affiliation_strings":["Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK"],"affiliations":[{"raw_affiliation_string":"Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK","institution_ids":["https://openalex.org/I166337079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076173089","display_name":"M. Sandler","orcid":"https://orcid.org/0000-0002-5691-8107"},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mark Sandler","raw_affiliation_strings":["Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK"],"affiliations":[{"raw_affiliation_string":"Queen Mary University of London, London, UK, Centre for Digital Music, EECS E1 4FZ, London, UK","institution_ids":["https://openalex.org/I166337079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091175785","display_name":"Kyunghyun Cho","orcid":"https://orcid.org/0000-0003-1669-3211"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kyunghyun Cho","raw_affiliation_strings":["New York University, NY, USA, Center for Data Science 715 Broadway, New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"New York University, NY, USA, Center for Data Science 715 Broadway, New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5011038627"],"corresponding_institution_ids":["https://openalex.org/I166337079"],"apc_list":null,"apc_paid":null,"fwci":0.9958,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.7544203,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1870","last_page":"1874"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.8369814157485962},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7446131706237793},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6670000553131104},{"id":"https://openalex.org/keywords/logarithm","display_name":"Logarithm","score":0.6061344146728516},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5865734815597534},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5822006464004517},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.4893321394920349},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4845832586288452},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.4787689745426178},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46987587213516235},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.4400373101234436},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.429246187210083},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.15199583768844604},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.12977847456932068},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1092727780342102},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.0971333384513855}],"concepts":[{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.8369814157485962},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7446131706237793},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6670000553131104},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.6061344146728516},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5865734815597534},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5822006464004517},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.4893321394920349},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4845832586288452},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.4787689745426178},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46987587213516235},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.4400373101234436},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.429246187210083},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.15199583768844604},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.12977847456932068},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1092727780342102},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0971333384513855},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.23919/eusipco.2018.8553106","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco.2018.8553106","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 26th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1709.01922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1709.01922","pdf_url":"https://arxiv.org/pdf/1709.01922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2751958095","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1709.01922","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:qmro.qmul.ac.uk:123456789/68127","is_oa":false,"landing_page_url":"https://qmro.qmul.ac.uk/xmlui/handle/123456789/68127","pdf_url":null,"source":{"id":"https://openalex.org/S4306400530","display_name":"Queen Mary Research Online (Queen Mary University of London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I166337079","host_organization_name":"Queen Mary University of London","host_organization_lineage":["https://openalex.org/I166337079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Proceeding"},{"id":"doi:10.48550/arxiv.1709.01922","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1709.01922","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1709.01922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1709.01922","pdf_url":"https://arxiv.org/pdf/1709.01922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8217561489","display_name":null,"funder_award_id":"EP/L019981/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320332999","display_name":"Horizon 2020 Framework Programme","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2751958095.pdf","grobid_xml":"https://content.openalex.org/works/W2751958095.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1556219185","https://openalex.org/W1606347560","https://openalex.org/W1677182931","https://openalex.org/W1988115241","https://openalex.org/W2013020033","https://openalex.org/W2042390666","https://openalex.org/W2059652044","https://openalex.org/W2137028279","https://openalex.org/W2176412452","https://openalex.org/W2198584637","https://openalex.org/W2337024056","https://openalex.org/W2404620398","https://openalex.org/W2575145750","https://openalex.org/W2721931776","https://openalex.org/W2756184659","https://openalex.org/W2914484425","https://openalex.org/W2949117887","https://openalex.org/W2963369619","https://openalex.org/W2963451564","https://openalex.org/W2963980515","https://openalex.org/W2964121744","https://openalex.org/W3210141620","https://openalex.org/W4255949318","https://openalex.org/W6631190155","https://openalex.org/W6712946787","https://openalex.org/W6715395060","https://openalex.org/W6732185156","https://openalex.org/W6740352302"],"related_works":["https://openalex.org/W2964285380","https://openalex.org/W2895105229","https://openalex.org/W2592944988","https://openalex.org/W1556219185","https://openalex.org/W2935162632","https://openalex.org/W2593179621","https://openalex.org/W2794150026","https://openalex.org/W2801356078","https://openalex.org/W2775123266","https://openalex.org/W3012971020","https://openalex.org/W2952003418","https://openalex.org/W2938078275","https://openalex.org/W3135186482","https://openalex.org/W2553581788","https://openalex.org/W2777468850","https://openalex.org/W2963517948","https://openalex.org/W3117786798","https://openalex.org/W3134834378","https://openalex.org/W2923260971","https://openalex.org/W2999819273"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"empirically":[4],"investigate":[5],"the":[6],"effect":[7],"of":[8],"audio":[9,23],"preprocessing":[10,24,43],"on":[11],"music":[12],"tagging":[13],"with":[14],"deep":[15],"neural":[16],"networks.":[17],"We":[18,36],"perform":[19],"comprehensive":[20],"experiments":[21],"involving":[22],"using":[25],"different":[26],"time-frequency":[27],"representations,":[28],"logarithmic":[29],"magnitude":[30,48],"compression,":[31],"frequency":[32],"weighting,":[33],"and":[34],"scaling.":[35],"show":[37],"that":[38],"many":[39],"commonly":[40],"used":[41],"input":[42],"techniques":[44],"are":[45],"redundant":[46],"except":[47],"compression.":[49]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":3}],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2025-10-10T00:00:00"}
