{"id":"https://openalex.org/W7158606069","doi":"https://doi.org/10.48550/arxiv.2604.25937","title":"SongBench: A Fine-Grained Multi-Aspect Benchmark for Song Quality Assessment","display_name":"SongBench: A Fine-Grained Multi-Aspect Benchmark for Song Quality Assessment","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7158606069","doi":"https://doi.org/10.48550/arxiv.2604.25937"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.25937","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001469325","display_name":"Dapeng Wu","orcid":"https://orcid.org/0000-0003-1755-0183"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Dapeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134916567","display_name":"Shun Lei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei, Shun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134921450","display_name":"Wei Tan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134878782","display_name":"Guangzheng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Guangzheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102956206","display_name":"Yunzhe Wang","orcid":"https://orcid.org/0000-0002-1755-6430"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yunzhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102222270","display_name":"Huaicheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Huaicheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056321739","display_name":"Lishi Zuo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zuo, Lishi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134926448","display_name":"Zhiyong Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Zhiyong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.8611999750137329,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.8611999750137329,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.05510000139474869,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.02500000037252903,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.79339998960495},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.7091000080108643},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6190999746322632},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6086999773979187},{"id":"https://openalex.org/keywords/quality-assessment","display_name":"Quality assessment","score":0.5361999869346619},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5095999836921692}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.79339998960495},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.7091000080108643},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6733999848365784},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6190999746322632},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6086999773979187},{"id":"https://openalex.org/C3020001037","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assessment","level":3,"score":0.5361999869346619},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5095999836921692},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43619999289512634},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4088999927043915},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.3758000135421753},{"id":"https://openalex.org/C2983311337","wikidata":"https://www.wikidata.org/wiki/Q34379","display_name":"Musical instrument","level":2,"score":0.3179999887943268},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2858999967575073},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.27149999141693115},{"id":"https://openalex.org/C118530786","wikidata":"https://www.wikidata.org/wiki/Q1134732","display_name":"Instrumentation (computer programming)","level":2,"score":0.2669999897480011},{"id":"https://openalex.org/C2984588014","wikidata":"https://www.wikidata.org/wiki/Q730675","display_name":"Quantitative assessment","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26260000467300415}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advancements":[1],"in":[2,84],"Text-to-Song":[3],"generation":[4],"have":[5],"enabled":[6],"realistic":[7],"musical":[8],"content":[9],"production,":[10],"yet":[11],"existing":[12],"evaluation":[13],"benchmarks":[14],"lack":[15],"the":[16,96],"professional":[17,100],"granularity":[18],"to":[19,94],"capture":[20],"multi-dimensional":[21],"aesthetic":[22],"nuances.":[23],"In":[24],"this":[25,50],"paper,":[26],"we":[27,52],"propose":[28],"SongBench,":[29],"a":[30,91],"specialized":[31],"framework":[32],"for":[33],"fine-grained":[34,81],"song":[35,104],"assessment":[36],"across":[37],"seven":[38],"key":[39],"dimensions:":[40],"Vocal,":[41],"Instrument,":[42],"Melody,":[43],"Structure,":[44],"Arrangement,":[45],"Mixing,":[46],"and":[47,101],"Musicality.":[48],"Utilizing":[49],"framework,":[51],"construct":[53],"an":[54],"expert-annotated":[55],"database":[56],"comprising":[57],"11,717":[58],"samples":[59],"from":[60],"state-of-the-art":[61,86],"models,":[62,87],"labeled":[63],"by":[64],"music":[65],"professionals.":[66],"Extensive":[67],"experimental":[68],"results":[69],"demonstrate":[70],"that":[71],"SongBench":[72,88],"achieves":[73],"high":[74],"correlation":[75],"with":[76],"expert":[77],"ratings.":[78],"By":[79],"revealing":[80],"performance":[82],"gaps":[83],"current":[85],"serves":[89],"as":[90],"diagnostic":[92],"benchmark":[93],"steer":[95],"development":[97],"toward":[98],"more":[99],"musically":[102],"coherent":[103],"generation.":[105]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-01T00:00:00"}
