{"id":"https://openalex.org/W3199367802","doi":"https://doi.org/10.1109/compsac51774.2021.00140","title":"Parallel Deep Neural Networks for Musical Genre Classification: A Case Study","display_name":"Parallel Deep Neural Networks for Musical Genre Classification: A Case Study","publication_year":2021,"publication_date":"2021-07-01","ids":{"openalex":"https://openalex.org/W3199367802","doi":"https://doi.org/10.1109/compsac51774.2021.00140","mag":"3199367802"},"language":"en","primary_location":{"id":"doi:10.1109/compsac51774.2021.00140","is_oa":false,"landing_page_url":"https://doi.org/10.1109/compsac51774.2021.00140","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 45th Annual Computers, Software, and Applications Conference (COMPSAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101437652","display_name":"Hui Yuan","orcid":"https://orcid.org/0000-0002-9099-7259"},"institutions":[{"id":"https://openalex.org/I164389053","display_name":"Fordham University","ror":"https://ror.org/03qnxaf80","country_code":"US","type":"education","lineage":["https://openalex.org/I164389053"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hui Yuan","raw_affiliation_strings":["Fordham University,Computer and Information Science Department,NY,NY,10023"],"affiliations":[{"raw_affiliation_string":"Fordham University,Computer and Information Science Department,NY,NY,10023","institution_ids":["https://openalex.org/I164389053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045059848","display_name":"Wenjia Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I164389053","display_name":"Fordham University","ror":"https://ror.org/03qnxaf80","country_code":"US","type":"education","lineage":["https://openalex.org/I164389053"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wenjia Zheng","raw_affiliation_strings":["Fordham University,Computer and Information Science Department,NY,NY,10023"],"affiliations":[{"raw_affiliation_string":"Fordham University,Computer and Information Science Department,NY,NY,10023","institution_ids":["https://openalex.org/I164389053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050837693","display_name":"Yun S. Song","orcid":"https://orcid.org/0000-0002-0734-9868"},"institutions":[{"id":"https://openalex.org/I164389053","display_name":"Fordham University","ror":"https://ror.org/03qnxaf80","country_code":"US","type":"education","lineage":["https://openalex.org/I164389053"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yun Song","raw_affiliation_strings":["Fordham University,Computer and Information Science Department,NY,NY,10023"],"affiliations":[{"raw_affiliation_string":"Fordham University,Computer and Information Science Department,NY,NY,10023","institution_ids":["https://openalex.org/I164389053"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049423390","display_name":"Yijun Zhao","orcid":"https://orcid.org/0000-0003-2424-5988"},"institutions":[{"id":"https://openalex.org/I164389053","display_name":"Fordham University","ror":"https://ror.org/03qnxaf80","country_code":"US","type":"education","lineage":["https://openalex.org/I164389053"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yijun Zhao","raw_affiliation_strings":["Fordham University,Computer and Information Science Department,NY,NY,10023"],"affiliations":[{"raw_affiliation_string":"Fordham University,Computer and Information Science Department,NY,NY,10023","institution_ids":["https://openalex.org/I164389053"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101437652"],"corresponding_institution_ids":["https://openalex.org/I164389053"],"apc_list":null,"apc_paid":null,"fwci":0.7618,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.71176471,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"10","issue":null,"first_page":"1032","last_page":"1035"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9829999804496765,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7892209887504578},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.6647500991821289},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5803413391113281},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5203644633293152},{"id":"https://openalex.org/keywords/music-information-retrieval","display_name":"Music information retrieval","score":0.49822497367858887},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.47595450282096863},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.47411587834358215},{"id":"https://openalex.org/keywords/rhythm","display_name":"Rhythm","score":0.4215218424797058},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4214667081832886},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.38947147130966187},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.389036625623703},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3708992004394531}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892209887504578},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.6647500991821289},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5803413391113281},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5203644633293152},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.49822497367858887},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.47595450282096863},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.47411587834358215},{"id":"https://openalex.org/C135343436","wikidata":"https://www.wikidata.org/wiki/Q170406","display_name":"Rhythm","level":2,"score":0.4215218424797058},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4214667081832886},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.38947147130966187},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.389036625623703},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3708992004394531},{"id":"https://openalex.org/C107038049","wikidata":"https://www.wikidata.org/wiki/Q35986","display_name":"Aesthetics","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/compsac51774.2021.00140","is_oa":false,"landing_page_url":"https://doi.org/10.1109/compsac51774.2021.00140","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 45th Annual Computers, Software, and Applications Conference (COMPSAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5600000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1905882502","https://openalex.org/W2064675550","https://openalex.org/W2117539524","https://openalex.org/W2133824856","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2297628473","https://openalex.org/W2340134902","https://openalex.org/W2514413323","https://openalex.org/W2520164769","https://openalex.org/W2613155248","https://openalex.org/W2747932385","https://openalex.org/W2766736793","https://openalex.org/W2779371882","https://openalex.org/W2919115771","https://openalex.org/W2951326654","https://openalex.org/W2963451564","https://openalex.org/W2975625678","https://openalex.org/W6684191040","https://openalex.org/W6697356650","https://openalex.org/W6704025895","https://openalex.org/W6726381175","https://openalex.org/W6727654133","https://openalex.org/W6747722063"],"related_works":["https://openalex.org/W2530685530","https://openalex.org/W4375868962","https://openalex.org/W2011227383","https://openalex.org/W2088854863","https://openalex.org/W4402568167","https://openalex.org/W3179495260","https://openalex.org/W1976719989","https://openalex.org/W3127543252","https://openalex.org/W2065606036","https://openalex.org/W3135448569"],"abstract_inverted_index":{"Musical":[0],"genres":[1],"are":[2],"labels":[3],"created":[4],"to":[5,38,55,105,212],"categorize":[6],"the":[7,56,64,67,95,124,175,187,190,197,214],"universe":[8],"of":[9,36,59,94,149,163,172,196,220],"music.":[10],"A":[11],"music":[12,37,45,62,113,150,221],"genre":[13,42,46,184],"is":[14,30,48],"characterized":[15],"by":[16],"its":[17],"unique":[18],"form":[19],"or":[20],"style,":[21],"including":[22],"instrumentation,":[23],"rhythmic":[24],"structure,":[25],"and":[26,66,102,109,136,151,217],"harmonic":[27],"content.":[28],"It":[29],"conventional":[31],"for":[32,206],"a":[33,91,129,141,160],"large":[34,57],"collection":[35],"be":[39],"structured":[40],"using":[41,140],"hierarchies.":[43],"Automatic":[44],"classification":[47],"gaining":[49],"attention":[50],"in":[51,70,83,182],"recent":[52],"years":[53],"due":[54],"amount":[58],"available":[60],"digital":[61],"on":[63,123,159,174],"web":[65],"latest":[68],"advances":[69],"artificial":[71],"intelligence.":[72],"In":[73,86,115],"particular,":[74],"various":[75],"deep":[76,209],"learning-based":[77],"approaches":[78],"have":[79],"delivered":[80],"promising":[81],"results":[82,202],"this":[84,87],"domain.":[85],"paper,":[88],"we":[89,118,134],"present":[90],"case":[92],"study":[93],"PRCNN":[96],"framework":[97],"(2017),":[98],"which":[99],"parallelizes":[100],"CNN":[101],"bi-directional":[103],"GRU":[104],"capture":[106],"both":[107],"spatial":[108,216],"temporal":[110,218],"signals":[111],"from":[112],"spectrograms.":[114],"our":[116,120,138,157],"study,":[117],"designed":[119],"model":[121,131,139,158,167,191,213],"based":[122],"proposed":[125],"concept":[126],"but":[127],"with":[128,146,178],"different":[130],"structure.":[132],"Furthermore,":[133],"trained":[135],"evaluated":[137],"more":[142],"comprehensive":[143],"dataset":[144,162,177],"(FMA)":[145],"8,252":[147],"pieces":[148],"17":[152],"genres.":[153],"We":[154],"further":[155],"validated":[156],"curated":[161,188],"15":[164,198],"songs.":[165,199],"Our":[166,200],"achieves":[168],"an":[169],"overall":[170],"accuracy":[171],"88%":[173],"FMA":[176],"above":[179],"90%":[180],"accuracies":[181],"four":[183],"categories.":[185],"For":[186],"dataset,":[189],"correctly":[192],"classified":[193],"11":[194],"out":[195],"experimental":[201],"provide":[203],"convincing":[204],"support":[205],"utilizing":[207],"parallelized":[208],"neural":[210],"networks":[211],"concurrent":[215],"characteristics":[219],"data.":[222]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
