{"id":"https://openalex.org/W3160397857","doi":"https://doi.org/10.1109/ssci50451.2021.9659979","title":"1D CNN Architectures for Music Genre Classification","display_name":"1D CNN Architectures for Music Genre Classification","publication_year":2021,"publication_date":"2021-12-05","ids":{"openalex":"https://openalex.org/W3160397857","doi":"https://doi.org/10.1109/ssci50451.2021.9659979","mag":"3160397857"},"language":"en","primary_location":{"id":"doi:10.1109/ssci50451.2021.9659979","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci50451.2021.9659979","pdf_url":null,"source":{"id":"https://openalex.org/S4363604921","display_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2105.07302","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081396321","display_name":"Safaa Allamy","orcid":null},"institutions":[{"id":"https://openalex.org/I9736820","display_name":"\u00c9cole de Technologie Sup\u00e9rieure","ror":"https://ror.org/0020snb74","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120","https://openalex.org/I9736820"]},{"id":"https://openalex.org/I159129438","display_name":"Universit\u00e9 du Qu\u00e9bec \u00e0 Montr\u00e9al","ror":"https://ror.org/002rjbv21","country_code":"CA","type":"education","lineage":["https://openalex.org/I159129438","https://openalex.org/I49663120"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Safaa Allamy","raw_affiliation_strings":["Ecole de Technologie Sup\u00e9rieure Universit\u00e9 du Qu\u00e9bec, Montreal, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Ecole de Technologie Sup\u00e9rieure Universit\u00e9 du Qu\u00e9bec, Montreal, QC, Canada","institution_ids":["https://openalex.org/I9736820","https://openalex.org/I159129438"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074262951","display_name":"Alessandro L. Koerich","orcid":"https://orcid.org/0000-0001-5879-7014"},"institutions":[{"id":"https://openalex.org/I159129438","display_name":"Universit\u00e9 du Qu\u00e9bec \u00e0 Montr\u00e9al","ror":"https://ror.org/002rjbv21","country_code":"CA","type":"education","lineage":["https://openalex.org/I159129438","https://openalex.org/I49663120"]},{"id":"https://openalex.org/I9736820","display_name":"\u00c9cole de Technologie Sup\u00e9rieure","ror":"https://ror.org/0020snb74","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120","https://openalex.org/I9736820"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Alessandro Lameiras Koerich","raw_affiliation_strings":["Ecole de Technologie Sup\u00e9rieure Universit\u00e9 du Qu\u00e9bec, Montreal, QC, Canada","Ecole de technologie sup\u00e9rieure"],"affiliations":[{"raw_affiliation_string":"Ecole de Technologie Sup\u00e9rieure Universit\u00e9 du Qu\u00e9bec, Montreal, QC, Canada","institution_ids":["https://openalex.org/I9736820","https://openalex.org/I159129438"]},{"raw_affiliation_string":"Ecole de technologie sup\u00e9rieure","institution_ids":["https://openalex.org/I9736820"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5081396321"],"corresponding_institution_ids":["https://openalex.org/I159129438","https://openalex.org/I9736820"],"apc_list":null,"apc_paid":null,"fwci":0.5163,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.62786003,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"01","last_page":"07"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7971620559692383},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6821185350418091},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.6101071238517761},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.6032808423042297},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5445535182952881},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5436034798622131},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5075761079788208},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5031477808952332},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4934288561344147},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.47818997502326965},{"id":"https://openalex.org/keywords/audio-analyzer","display_name":"Audio analyzer","score":0.45245230197906494},{"id":"https://openalex.org/keywords/digital-audio","display_name":"Digital audio","score":0.4353538155555725},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.11535507440567017},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.11488887667655945},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08857274055480957}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7971620559692383},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6821185350418091},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.6101071238517761},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.6032808423042297},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5445535182952881},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5436034798622131},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5075761079788208},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5031477808952332},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4934288561344147},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.47818997502326965},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.45245230197906494},{"id":"https://openalex.org/C87687168","wikidata":"https://www.wikidata.org/wiki/Q173114","display_name":"Digital audio","level":4,"score":0.4353538155555725},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.11535507440567017},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11488887667655945},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08857274055480957},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/ssci50451.2021.9659979","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci50451.2021.9659979","pdf_url":null,"source":{"id":"https://openalex.org/S4363604921","display_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2105.07302","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.07302","pdf_url":"https://arxiv.org/pdf/2105.07302","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:3160397857","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/2105.07302v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:espace2.etsmtl.ca:24133","is_oa":false,"landing_page_url":"https://espace2.etsmtl.ca/id/eprint/24133/","pdf_url":null,"source":{"id":"https://openalex.org/S4306402392","display_name":"Espace \u00c9TS (ETS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1341030882","host_organization_name":"Educational Testing Service","host_organization_lineage":["https://openalex.org/I1341030882"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Compte rendu de conf\u00e9rence"},{"id":"doi:10.48550/arxiv.2105.07302","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2105.07302","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2105.07302","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.07302","pdf_url":"https://arxiv.org/pdf/2105.07302","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3160397857.pdf","grobid_xml":"https://content.openalex.org/works/W3160397857.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1421840687","https://openalex.org/W1560641100","https://openalex.org/W1653228644","https://openalex.org/W1966311970","https://openalex.org/W2059652044","https://openalex.org/W2100700860","https://openalex.org/W2101151533","https://openalex.org/W2124541215","https://openalex.org/W2133824856","https://openalex.org/W2138266693","https://openalex.org/W2138423018","https://openalex.org/W2149969775","https://openalex.org/W2194775991","https://openalex.org/W2398826216","https://openalex.org/W2520160253","https://openalex.org/W2563031223","https://openalex.org/W2758738105","https://openalex.org/W2794150026","https://openalex.org/W2935162632","https://openalex.org/W2962813390","https://openalex.org/W2963181423","https://openalex.org/W2963358591","https://openalex.org/W2963451564","https://openalex.org/W2963493667","https://openalex.org/W2963669405","https://openalex.org/W2963838685","https://openalex.org/W2964218314","https://openalex.org/W2993396030","https://openalex.org/W3045302321","https://openalex.org/W3091508658","https://openalex.org/W4239611119","https://openalex.org/W6628411372","https://openalex.org/W6633570323","https://openalex.org/W6727336983","https://openalex.org/W6730401039","https://openalex.org/W6732646663","https://openalex.org/W6741185346","https://openalex.org/W6745878906","https://openalex.org/W6769748652","https://openalex.org/W6781326571"],"related_works":["https://openalex.org/W2997091880","https://openalex.org/W3162646160","https://openalex.org/W3014800401","https://openalex.org/W2784006950","https://openalex.org/W3180921123","https://openalex.org/W2801661609","https://openalex.org/W3032019894","https://openalex.org/W2549104515","https://openalex.org/W2963232038","https://openalex.org/W2012296273","https://openalex.org/W2969426323","https://openalex.org/W2902922150","https://openalex.org/W3105202226","https://openalex.org/W2734984521","https://openalex.org/W2989838200","https://openalex.org/W3027136955","https://openalex.org/W2794355319","https://openalex.org/W2904230401","https://openalex.org/W2787229240"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,28,31,72,87,97,126],"1D":[4,21,25,84,120,152],"residual":[5,121],"convolutional":[6,40],"neural":[7],"network":[8],"(CNN)":[9],"architecture":[10],"for":[11],"music":[12,57,89,147],"genre":[13,58,90],"classification":[14,91],"and":[15,30,50,149],"compares":[16],"it":[17,139],"with":[18,77],"other":[19,151],"recent":[20],"CNN":[22,122,153],"architectures.":[23,154],"The":[24,61,115,133],"CNNs":[26],"learn":[27,51],"representation":[29],"discriminant":[32],"directly":[33],"from":[34],"the":[35,43,47,56,65,78,83,104,112,118],"raw":[36],"audio":[37,48,66,99,108,131],"signal.":[38],"Several":[39],"layers":[41],"capture":[42],"time-frequency":[44],"characteristics":[45],"of":[46,82,117,129,142],"signal":[49,67],"various":[52],"filters":[53],"relevant":[54],"to":[55,75],"recognition":[59],"task.":[60],"proposed":[62,119],"approach":[63],"splits":[64],"into":[68],"overlapped":[69],"segments":[70],"using":[71],"sliding":[73],"window":[74],"comply":[76],"fixed-length":[79],"input":[80],"constraint":[81],"CNNs.":[85],"As":[86],"result,":[88],"can":[92],"be":[93],"carried":[94],"out":[95],"on":[96,102,106,125],"single":[98],"segment":[100],"or":[101],"aggregating":[103],"predictions":[105],"several":[107],"segments,":[109],"which":[110],"improves":[111],"final":[113],"accuracy.":[114],"performance":[116],"is":[123],"assessed":[124],"public":[127],"dataset":[128],"1,000":[130],"clips.":[132],"experimental":[134],"results":[135],"have":[136],"shown":[137],"that":[138],"achieves":[140],"80.93%":[141],"mean":[143],"accuracy":[144],"in":[145],"classifying":[146],"genres":[148],"outperforms":[150]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
