{"id":"https://openalex.org/W4401991255","doi":"https://doi.org/10.1109/icmew63481.2024.10645427","title":"Popular Hooks: A Multimodal Dataset of Musical Hooks for Music Understanding and Generation","display_name":"Popular Hooks: A Multimodal Dataset of Musical Hooks for Music Understanding and Generation","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4401991255","doi":"https://doi.org/10.1109/icmew63481.2024.10645427"},"language":"en","primary_location":{"id":"doi:10.1109/icmew63481.2024.10645427","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645427","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074995310","display_name":"Xinda Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinda Wu","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115695321","display_name":"Jiaming Wang","orcid":"https://orcid.org/0009-0006-0283-8036"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaming Wang","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102329472","display_name":"Jiaxing Yu","orcid":"https://orcid.org/0000-0002-7762-6082"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxing Yu","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000186323","display_name":"Tieyao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tieyao Zhang","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101577175","display_name":"Kejun Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kejun Zhang","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I168879160"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5074995310"],"corresponding_institution_ids":["https://openalex.org/I168879160"],"apc_list":null,"apc_paid":null,"fwci":1.1251,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.77374451,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.7808131575584412},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6795953512191772},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3475133180618286},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33430689573287964},{"id":"https://openalex.org/keywords/visual-arts","display_name":"Visual arts","score":0.16178423166275024},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.1315423846244812}],"concepts":[{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.7808131575584412},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6795953512191772},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3475133180618286},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33430689573287964},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.16178423166275024},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.1315423846244812}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmew63481.2024.10645427","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmew63481.2024.10645427","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G111693571","display_name":null,"funder_award_id":"62272409","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2149628368","https://openalex.org/W2468785836","https://openalex.org/W2475687244","https://openalex.org/W2592535880","https://openalex.org/W2741036097","https://openalex.org/W2759171953","https://openalex.org/W2884558435","https://openalex.org/W2952638691","https://openalex.org/W3085812513","https://openalex.org/W3092850823","https://openalex.org/W3101943858","https://openalex.org/W3173187964","https://openalex.org/W3175663427","https://openalex.org/W3182909996","https://openalex.org/W3190667038","https://openalex.org/W4221167396","https://openalex.org/W4238292067","https://openalex.org/W4243989635","https://openalex.org/W4288095339","https://openalex.org/W4315881822","https://openalex.org/W4372260250","https://openalex.org/W4376607936","https://openalex.org/W4376653414","https://openalex.org/W4377140494","https://openalex.org/W4386942584","https://openalex.org/W4388891078","https://openalex.org/W4390873340","https://openalex.org/W6768893601","https://openalex.org/W6781910838","https://openalex.org/W6798288246","https://openalex.org/W6799448330","https://openalex.org/W6810265253","https://openalex.org/W6846718565","https://openalex.org/W6847363464","https://openalex.org/W6849063711","https://openalex.org/W6853220273","https://openalex.org/W6856191415","https://openalex.org/W6858930701"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W4402327032","https://openalex.org/W2382290278"],"abstract_inverted_index":{"The":[0],"Internet":[1],"is":[2,17],"rich":[3],"in":[4,9],"unimodal":[5],"music":[6,23,34,49,64,93,114],"data,":[7],"available":[8],"either":[10],"symbolic":[11],"or":[12],"audio":[13],"representations.":[14],"However,":[15],"there":[16],"a":[18,45,90,103],"notable":[19],"scarcity":[20],"of":[21,59,75],"multimodal":[22,48,92],"datasets":[24],"that":[25],"offer":[26],"aligned":[27],"modal":[28],"information":[29],"and":[30,36,67,85,101],"comprehensive":[31],"annotations":[32,74],"for":[33,97],"understanding":[35],"generation.":[37],"In":[38],"this":[39,118],"paper,":[40],"we":[41,88,111],"introduce":[42],"Popular":[43],"Hooks:":[44],"publicly":[46],"accessible":[47],"dataset":[50,71],"comprising":[51],"38,694":[52],"popular":[53],"musical":[54,77],"hooks":[55],"(i.e.,":[56],"memorable":[57],"sections":[58],"songs)":[60],"with":[61],"synchronized":[62],"MIDI,":[63],"video,":[65],"audio,":[66],"lyrics.":[68],"Furthermore,":[69],"the":[70,125],"provides":[72],"detailed":[73],"high-level":[76],"attributes":[78],"such":[79],"as":[80],"tonality,":[81],"structure,":[82],"genre,":[83],"emotion,":[84],"region.":[86],"Specifically,":[87],"leverage":[89],"pre-trained":[91],"emotion":[94,99],"recognition":[95],"framework":[96],"automatic":[98],"labeling":[100],"conduct":[102],"user":[104],"study":[105],"to":[106,123],"assess":[107],"its":[108,121],"accuracy.":[109],"Finally,":[110],"explore":[112],"emotion-conditioned":[113],"generation":[115],"baselines":[116],"using":[117],"dataset,":[119],"demonstrating":[120],"potential":[122],"advance":[124],"field.":[126]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
