{"id":"https://openalex.org/W2585464829","doi":"https://doi.org/10.1109/iscslp.2016.7918369","title":"Long short-term memory recurrent neural network based segment features for music genre classification","display_name":"Long short-term memory recurrent neural network based segment features for music genre classification","publication_year":2016,"publication_date":"2016-10-01","ids":{"openalex":"https://openalex.org/W2585464829","doi":"https://doi.org/10.1109/iscslp.2016.7918369","mag":"2585464829"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2016.7918369","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2016.7918369","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 10th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012133457","display_name":"Jia Dai","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jia Dai","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027369782","display_name":"Liang Shan","orcid":"https://orcid.org/0000-0002-8833-2514"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shan Liang","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100652844","display_name":"Wei Xue","orcid":"https://orcid.org/0000-0002-4942-7748"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Xue","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102306089","display_name":"Chongjia Ni","orcid":null},"institutions":[{"id":"https://openalex.org/I59483232","display_name":"Shandong University of Finance and Economics","ror":"https://ror.org/02e2nnq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I59483232"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chongjia Ni","raw_affiliation_strings":["Shandong University of Finance and Economics, shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong University of Finance and Economics, shandong, China","institution_ids":["https://openalex.org/I59483232"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039635290","display_name":"Wenju Liu","orcid":"https://orcid.org/0000-0001-9088-8282"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenju Liu","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5012133457"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":1.7839,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.86866482,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8121819496154785},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.7768994569778442},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.7420332431793213},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.7241286635398865},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6764341592788696},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5807475447654724},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.5343044996261597},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.49747446179389954},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4409904181957245},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4302322268486023},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4107985198497772},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4086267948150635}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8121819496154785},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.7768994569778442},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.7420332431793213},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.7241286635398865},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6764341592788696},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5807475447654724},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.5343044996261597},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.49747446179389954},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4409904181957245},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4302322268486023},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4107985198497772},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4086267948150635},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iscslp.2016.7918369","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2016.7918369","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 10th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-125455","is_oa":false,"landing_page_url":"http://lbdiscover.ust.hk/uresolver?url_ver=Z39.88-2004&rft_val_fmt=info:ofi/fmt:kev:mtx:journal&rfr_id=info:sid/HKUST:SPI&rft.genre=article&rft.issn=&rft.volume=&rft.issue=&rft.date=2017&rft.spage=&rft.aulast=Dai&rft.aufirst=&rft.atitle=Long+short-term+memory+recurrent+neural+network+based+segment+features+for+music+genre+classification&rft.title=Proceedings+of+2016+10th+International+Symposium+on+Chinese+Spoken+Language+Processing%2C+ISCSLP+2016","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1496120315","https://openalex.org/W1509691205","https://openalex.org/W1515441714","https://openalex.org/W1601124178","https://openalex.org/W1966838590","https://openalex.org/W1970578576","https://openalex.org/W1975126845","https://openalex.org/W2071103260","https://openalex.org/W2093231248","https://openalex.org/W2101252291","https://openalex.org/W2104352833","https://openalex.org/W2110589736","https://openalex.org/W2128196382","https://openalex.org/W2136848157","https://openalex.org/W2142236629","https://openalex.org/W2147768505","https://openalex.org/W2295001676","https://openalex.org/W2299804884","https://openalex.org/W2368991465","https://openalex.org/W2396025094","https://openalex.org/W2396346931","https://openalex.org/W2398751993","https://openalex.org/W2404938947","https://openalex.org/W6641716162","https://openalex.org/W6712550616","https://openalex.org/W6712642569","https://openalex.org/W6713805741"],"related_works":["https://openalex.org/W2912153778","https://openalex.org/W4387163678","https://openalex.org/W4288108708","https://openalex.org/W2973430807","https://openalex.org/W4385280324","https://openalex.org/W2890685186","https://openalex.org/W2984436043","https://openalex.org/W4390245176","https://openalex.org/W2912831041","https://openalex.org/W3173606726"],"abstract_inverted_index":{"In":[0,77],"the":[1,10,19,28,36,82,99,109,118,125,134,145,152,156,168,180,183],"conventional":[2],"frame":[3,103,112,130,153],"feature":[4,63,121,131,148,159],"based":[5,85],"music":[6,89],"genre":[7,90],"classification":[8,37,162],"methods,":[9],"audio":[11,23],"data":[12],"is":[13,24,31,95,122],"represented":[14],"by":[15],"independent":[16],"frames":[17],"and":[18,34,73],"sequential":[20,29],"nature":[21],"of":[22,55,101,111,128,182],"totally":[25],"ignored.":[26],"If":[27],"knowledge":[30],"well":[32],"modeled":[33],"combined,":[35],"performance":[38],"can":[39],"be":[40],"significantly":[41],"improved.":[42],"The":[43,92,105,138],"long":[44],"short-term":[45],"memory(LSTM)":[46],"recurrent":[47],"neural":[48,173],"network":[49,174],"(RNN)":[50],"which":[51],"uses":[52],"a":[53],"set":[54],"special":[56],"memory":[57],"cells":[58],"to":[59,97,132],"model":[60,170],"for":[61,69,88],"long-range":[62],"sequence,":[64],"has":[65],"been":[66],"successfully":[67],"used":[68,96],"many":[70],"sequence":[71,74],"labeling":[72],"prediction":[75],"tasks.":[76],"this":[78],"paper,":[79],"we":[80],"propose":[81],"LSTM":[83,93,102,119,146],"RNN":[84,94],"segment":[86,106,120,126,136,147,158,185],"features":[87,107,113],"classification.":[91],"learn":[98],"representation":[100,127],"feature.":[104,137,154,186],"are":[108],"statistics":[110],"in":[114],"each":[115],"segment.":[116],"Furthermore,":[117],"combined":[123],"with":[124],"initial":[129],"obtain":[133],"fusional":[135,157],"evaluation":[139],"on":[140],"ISMIR":[141],"database":[142],"show":[143,179],"that":[144],"performs":[149],"better":[150],"than":[151],"Overall,":[155],"achieves":[160],"89.71%":[161],"accuracy,":[163],"about":[164],"4.19%":[165],"improvement":[166,178],"over":[167],"baseline":[169],"using":[171],"deep":[172],"(DNN).":[175],"This":[176],"significant":[177],"effectiveness":[181],"proposed":[184]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":2}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
