{"id":"https://openalex.org/W4408352019","doi":"https://doi.org/10.1109/icassp49660.2025.10890633","title":"MusicMamba: A Dual-Feature Modeling Approach for Generating Chinese Traditional Music with Modal Precision","display_name":"MusicMamba: A Dual-Feature Modeling Approach for Generating Chinese Traditional Music with Modal Precision","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408352019","doi":"https://doi.org/10.1109/icassp49660.2025.10890633"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890633","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890633","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064212351","display_name":"Jiatao Chen","orcid":"https://orcid.org/0000-0003-4484-7441"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiatao Chen","raw_affiliation_strings":["Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102318008","display_name":"Xing Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xing Tang","raw_affiliation_strings":["Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051602167","display_name":"Tianming Xie","orcid":"https://orcid.org/0000-0002-9187-9764"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianming Xie","raw_affiliation_strings":["Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100765674","display_name":"Jing Wang","orcid":"https://orcid.org/0000-0002-1017-2231"},"institutions":[{"id":"https://openalex.org/I74525822","display_name":"Hubei University of Technology","ror":"https://ror.org/02d3fj342","country_code":"CN","type":"education","lineage":["https://openalex.org/I74525822"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Wang","raw_affiliation_strings":["Hubei University of Technology,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Hubei University of Technology,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I74525822"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107950470","display_name":"Wenjing Dong","orcid":"https://orcid.org/0009-0000-0604-5048"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjing Dong","raw_affiliation_strings":["Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029130019","display_name":"Bing Shi","orcid":"https://orcid.org/0000-0001-9117-1945"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Shi","raw_affiliation_strings":["Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology,School of Computer Science and Artificial Intelligence,Wuhan,China","institution_ids":["https://openalex.org/I196699116"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5064212351"],"corresponding_institution_ids":["https://openalex.org/I196699116"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05052015,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13996","display_name":"Diverse Musicological Studies","score":0.9469000101089478,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9157000184059143,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.7498464584350586},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.736794114112854},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7102857828140259},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5770904421806335},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4287196397781372},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3784503638744354},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.05756556987762451}],"concepts":[{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.7498464584350586},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.736794114112854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7102857828140259},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5770904421806335},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4287196397781372},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3784503638744354},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.05756556987762451},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890633","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890633","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323172","display_name":"Natural Science Foundation of Chongqing","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2601110281","https://openalex.org/W2809621972","https://openalex.org/W3038344852","https://openalex.org/W3092850823","https://openalex.org/W3092879656","https://openalex.org/W3097469673","https://openalex.org/W4212820163","https://openalex.org/W4386510708","https://openalex.org/W6704583309","https://openalex.org/W6749351710","https://openalex.org/W6760601182","https://openalex.org/W6781678156","https://openalex.org/W6781910838","https://openalex.org/W6782288222","https://openalex.org/W6782602824","https://openalex.org/W6790487804","https://openalex.org/W6803444062","https://openalex.org/W6810771649","https://openalex.org/W6841205203","https://openalex.org/W6849063711","https://openalex.org/W6859298233","https://openalex.org/W6861342692","https://openalex.org/W6863493712","https://openalex.org/W6870066658"],"related_works":["https://openalex.org/W2317351040","https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W613940353","https://openalex.org/W2320915480","https://openalex.org/W2952466936","https://openalex.org/W3147584709","https://openalex.org/W1988622314","https://openalex.org/W2393949104","https://openalex.org/W4236344264"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"deep":[3],"learning":[4],"has":[5],"advanced":[6],"the":[7,47,53,57,61,66,72,95],"MIDI":[8],"domain,":[9],"solidifying":[10],"music":[11,117,137,144],"generation":[12],"as":[13],"a":[14,113,140],"key":[15],"application":[16],"of":[17,56,65,123],"artificial":[18],"intelligence.":[19],"However,":[20],"most":[21],"research":[22],"focuses":[23],"on":[24,91],"Western":[25],"music,":[26],"facing":[27],"challenges":[28],"in":[29,35,105,131],"generating":[30,132],"Chinese":[31,115,135],"traditional":[32,116,136],"melodies,":[33],"particularly":[34],"capturing":[36,64],"modal":[37,103],"characteristics":[38],"and":[39,81,101],"emotional":[40],"expression.":[41],"To":[42,107],"address":[43],"this,":[44,92,109],"we":[45,70,93,110],"propose":[46,94],"Dual-Feature":[48],"Modeling":[49],"Module,":[50],"which":[51,77],"integrates":[52,78],"long-range":[54],"modeling":[55],"Mamba":[58,74],"Block":[59],"with":[60,134],"global":[62,82],"structure":[63],"Transformer":[67],"Block.":[68],"Additionally,":[69],"introduce":[71],"Bidirectional":[73],"Fusion":[75],"Layer,":[76],"local":[79],"details":[80],"structures":[83],"through":[84],"bidirectional":[85],"scanning,":[86],"enhancing":[87],"sequence":[88],"modeling.":[89],"Building":[90],"REMI-M":[96],"representation":[97],"to":[98],"better":[99],"capture":[100],"generate":[102],"information":[104],"melodies.":[106],"support":[108],"developed":[111],"FolkDB,":[112],"high-quality":[114],"dataset":[118],"covering":[119],"over":[120],"11":[121],"hours":[122],"music.":[124],"Experimental":[125],"results":[126],"show":[127],"our":[128],"architecture":[129],"excels":[130],"melodies":[133],"characteristics,":[138],"offering":[139],"new":[141],"solution":[142],"for":[143],"generation.":[145]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
