{"id":"https://openalex.org/W4414359717","doi":"https://doi.org/10.24963/ijcai.2025/1134","title":"NotaGen: Advancing Musicality in Symbolic Music Generation with Large Language Model Training Paradigms","display_name":"NotaGen: Advancing Musicality in Symbolic Music Generation with Large Language Model Training Paradigms","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4414359717","doi":"https://doi.org/10.24963/ijcai.2025/1134"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2025/1134","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/1134","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083052094","display_name":"Yashan Wang","orcid":"https://orcid.org/0000-0003-3379-1999"},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yashan Wang","raw_affiliation_strings":["Central Conservatory of Music, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078252194","display_name":"Shangda Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shangda Wu","raw_affiliation_strings":["Central Conservatory of Music, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046482790","display_name":"James Lee Hu","orcid":"https://orcid.org/0009-0009-5112-6280"},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhuai Hu","raw_affiliation_strings":["Central Conservatory of Music, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091528537","display_name":"Xingjian Du","orcid":null},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xingjian Du","raw_affiliation_strings":["University of Rochester, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Rochester, USA","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yueqi Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210141517","display_name":"Nuctech (China)","ror":"https://ror.org/057vhsp23","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210141517"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueqi Peng","raw_affiliation_strings":["Beijing Flowingtech Ltd., China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Flowingtech Ltd., China","institution_ids":["https://openalex.org/I4210141517"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019644611","display_name":"Yongxin Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yongxin Huang","raw_affiliation_strings":["Independent Researcher"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Independent Researcher","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041221926","display_name":"Shuai Fan","orcid":"https://orcid.org/0000-0002-1227-5154"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Fan","raw_affiliation_strings":["Beihang University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beihang University, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100375517","display_name":"Xiaobing Li","orcid":"https://orcid.org/0000-0001-5961-2114"},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobing Li","raw_affiliation_strings":["Central Conservatory of Music, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049175891","display_name":"Feng Yu","orcid":"https://orcid.org/0009-0007-0607-7315"},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Yu","raw_affiliation_strings":["Central Conservatory of Music, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046448314","display_name":"Maosong Sun","orcid":"https://orcid.org/0000-0002-6011-6115"},"institutions":[{"id":"https://openalex.org/I2799899675","display_name":"Central Conservatory of Music","ror":"https://ror.org/01pxc4g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799899675"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Maosong Sun","raw_affiliation_strings":["Central Conservatory of Music, China","Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Central Conservatory of Music, China","institution_ids":["https://openalex.org/I2799899675"]},{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5083052094"],"corresponding_institution_ids":["https://openalex.org/I2799899675"],"apc_list":null,"apc_paid":null,"fwci":8.6731,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.98110703,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"10207","last_page":"10215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9429000020027161,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/musicality","display_name":"Musicality","score":0.541700005531311},{"id":"https://openalex.org/keywords/the-symbolic","display_name":"The Symbolic","score":0.5310999751091003},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4794999957084656},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.46230000257492065},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.40779998898506165},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4007999897003174},{"id":"https://openalex.org/keywords/controllability","display_name":"Controllability","score":0.3978999853134155},{"id":"https://openalex.org/keywords/pop-music-automation","display_name":"Pop music automation","score":0.39750000834465027}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6320000290870667},{"id":"https://openalex.org/C113194728","wikidata":"https://www.wikidata.org/wiki/Q4130159","display_name":"Musicality","level":3,"score":0.541700005531311},{"id":"https://openalex.org/C2776095079","wikidata":"https://www.wikidata.org/wiki/Q489538","display_name":"The Symbolic","level":2,"score":0.5310999751091003},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4794999957084656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4684999883174896},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.40779998898506165},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4007999897003174},{"id":"https://openalex.org/C48209547","wikidata":"https://www.wikidata.org/wiki/Q1331104","display_name":"Controllability","level":2,"score":0.3978999853134155},{"id":"https://openalex.org/C73520026","wikidata":"https://www.wikidata.org/wiki/Q7229091","display_name":"Pop music automation","level":4,"score":0.39750000834465027},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.34709998965263367},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.33410000801086426},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3095000088214874},{"id":"https://openalex.org/C2776539107","wikidata":"https://www.wikidata.org/wiki/Q176501","display_name":"Timbre","level":3,"score":0.29670000076293945},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.28850001096725464},{"id":"https://openalex.org/C146902061","wikidata":"https://www.wikidata.org/wiki/Q476590","display_name":"Music psychology","level":3,"score":0.27570000290870667},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.27149999141693115},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C88639978","wikidata":"https://www.wikidata.org/wiki/Q233861","display_name":"Musical notation","level":3,"score":0.25690001249313354},{"id":"https://openalex.org/C10864753","wikidata":"https://www.wikidata.org/wiki/Q4353948","display_name":"Music and emotion","level":4,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2025/1134","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/1134","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"introduce":[1],"NotaGen,":[2],"a":[3],"symbolic":[4,98,126],"music":[5,51,99,127],"generation":[6,79,100],"model":[7],"aiming":[8],"to":[9,38],"explore":[10],"the":[11,21,40,73,93],"potential":[12],"of":[13,23,50,95],"producing":[14],"high-quality":[15,61],"classical":[16,62],"sheet":[17],"music.":[18],"Inspired":[19],"by":[20],"success":[22],"Large":[24],"Language":[25],"Models":[26],"(LLMs),":[27],"NotaGen":[28,114],"adopts":[29],"pre-training,":[30],"fine-tuning,":[31],"and":[32,55,81,105],"reinforcement":[33,69],"learning":[34],"paradigms":[35],"(henceforth":[36],"referred":[37],"as":[39],"LLM":[41],"training":[42],"paradigms).":[43],"It":[44],"is":[45],"pre-trained":[46],"on":[47,58,65],"1.6M":[48],"pieces":[49],"in":[52,97,125],"ABC":[53],"notation,":[54],"then":[56],"fine-tuned":[57],"approximately":[59],"9K":[60],"compositions":[63],"conditioned":[64],"\"period-composer-instrumentation\"":[66],"prompts.":[67],"For":[68],"learning,":[70],"we":[71],"propose":[72],"CLaMP-DPO":[74,96],"method,":[75],"which":[76],"further":[77],"enhances":[78],"quality":[80],"controllability":[82],"without":[83],"requiring":[84],"human":[85,119],"annotations":[86],"or":[87],"predefined":[88],"rewards.":[89],"Our":[90],"experiments":[91],"demonstrate":[92],"efficacy":[94],"models":[101,117],"with":[102],"different":[103],"architectures":[104],"encoding":[106],"schemes.":[107],"Furthermore,":[108],"subjective":[109],"A/B":[110],"tests":[111],"show":[112],"that":[113],"outperforms":[115],"baseline":[116],"against":[118],"compositions,":[120],"greatly":[121],"advancing":[122],"musical":[123],"aesthetics":[124],"generation.":[128]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
