{"id":"https://openalex.org/W4391407078","doi":"https://doi.org/10.1109/tmm.2024.3360695","title":"Drawlody: Sketch-Based Melody Creation With Enhanced Usability and Interpretability","display_name":"Drawlody: Sketch-Based Melody Creation With Enhanced Usability and Interpretability","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4391407078","doi":"https://doi.org/10.1109/tmm.2024.3360695"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2024.3360695","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3360695","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061702317","display_name":"Qihao Liang","orcid":"https://orcid.org/0000-0002-3866-6081"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Qihao Liang","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100423435","display_name":"Ye Wang","orcid":"https://orcid.org/0000-0002-0123-1260"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ye Wang","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5061702317"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":1.3109,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.79758183,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"26","issue":null,"first_page":"7074","last_page":"7088"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/melody","display_name":"Melody","score":0.9127600193023682},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8389154076576233},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8257792592048645},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.7483230233192444},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.70004802942276},{"id":"https://openalex.org/keywords/chord","display_name":"Chord (peer-to-peer)","score":0.6845875978469849},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5299633145332336},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.480714350938797},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44073230028152466},{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.4354100823402405},{"id":"https://openalex.org/keywords/music-information-retrieval","display_name":"Music information retrieval","score":0.43497759103775024},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40144258737564087},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.2268446981906891},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.20637813210487366},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09797826409339905},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.08627155423164368}],"concepts":[{"id":"https://openalex.org/C43803900","wikidata":"https://www.wikidata.org/wiki/Q170412","display_name":"Melody","level":3,"score":0.9127600193023682},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8389154076576233},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8257792592048645},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.7483230233192444},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.70004802942276},{"id":"https://openalex.org/C194147245","wikidata":"https://www.wikidata.org/wiki/Q1076368","display_name":"Chord (peer-to-peer)","level":2,"score":0.6845875978469849},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5299633145332336},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.480714350938797},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44073230028152466},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.4354100823402405},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.43497759103775024},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40144258737564087},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.2268446981906891},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.20637813210487366},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09797826409339905},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.08627155423164368},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2024.3360695","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3360695","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G7835538620","display_name":null,"funder_award_id":"MOE-T2EP20120-0012","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"}],"funders":[{"id":"https://openalex.org/F4320320751","display_name":"Ministry of Education - Singapore","ror":"https://ror.org/01kcva023"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":74,"referenced_works":["https://openalex.org/W805008270","https://openalex.org/W1983507146","https://openalex.org/W2139860487","https://openalex.org/W2142996485","https://openalex.org/W2160535745","https://openalex.org/W2166957649","https://openalex.org/W2245166091","https://openalex.org/W2328626131","https://openalex.org/W2338312508","https://openalex.org/W2340600463","https://openalex.org/W2572771584","https://openalex.org/W2594475271","https://openalex.org/W2898827701","https://openalex.org/W2901139351","https://openalex.org/W2901638613","https://openalex.org/W2901662698","https://openalex.org/W2916904544","https://openalex.org/W2945956523","https://openalex.org/W2949950073","https://openalex.org/W2953148995","https://openalex.org/W2955877667","https://openalex.org/W2964110616","https://openalex.org/W2973671566","https://openalex.org/W2997359842","https://openalex.org/W3006654639","https://openalex.org/W3033032256","https://openalex.org/W3047906741","https://openalex.org/W3049272330","https://openalex.org/W3092850823","https://openalex.org/W3092879656","https://openalex.org/W3101246092","https://openalex.org/W3137883189","https://openalex.org/W3161237630","https://openalex.org/W3175663427","https://openalex.org/W3186393076","https://openalex.org/W3201649632","https://openalex.org/W3207290297","https://openalex.org/W3213549365","https://openalex.org/W4200327213","https://openalex.org/W4206908116","https://openalex.org/W4210698306","https://openalex.org/W4213276648","https://openalex.org/W4224933341","https://openalex.org/W4226103472","https://openalex.org/W4285331791","https://openalex.org/W4285737960","https://openalex.org/W4286836754","https://openalex.org/W4304091524","https://openalex.org/W4311118080","https://openalex.org/W4312606165","https://openalex.org/W4312918978","https://openalex.org/W4313227022","https://openalex.org/W4315881822","https://openalex.org/W4317897847","https://openalex.org/W4321597988","https://openalex.org/W4376607936","https://openalex.org/W4376875909","https://openalex.org/W4377371824","https://openalex.org/W4385245566","https://openalex.org/W4385565260","https://openalex.org/W4385763952","https://openalex.org/W6633499030","https://openalex.org/W6703879901","https://openalex.org/W6704344484","https://openalex.org/W6713831496","https://openalex.org/W6734862562","https://openalex.org/W6760601182","https://openalex.org/W6765207196","https://openalex.org/W6765802021","https://openalex.org/W6781972552","https://openalex.org/W6799448330","https://openalex.org/W6801284891","https://openalex.org/W6849063711","https://openalex.org/W6852445011"],"related_works":["https://openalex.org/W2753058862","https://openalex.org/W2547055343","https://openalex.org/W2804082714","https://openalex.org/W2086473573","https://openalex.org/W1566263950","https://openalex.org/W1908769745","https://openalex.org/W2039049596","https://openalex.org/W3134670663","https://openalex.org/W4297791980","https://openalex.org/W2133554502"],"abstract_inverted_index":{"Sketch-based":[0],"melody":[1,12,80,119,131,155,186,209,223,253],"creation":[2,132],"systems":[3,85],"enable":[4],"people":[5,51,179],"to":[6,30,105,110,220],"compose":[7],"melodies":[8,16,90,201],"by":[9,145,228],"converting":[10],"human-sketched":[11,206],"contours":[13,207],"into":[14],"coherent":[15,185],"that":[17],"fit":[18],"the":[19,26,112,168,174,197,217,259],"depicted":[20],"contours.":[21],"This":[22,82,165],"remains":[23],"one":[24,55],"of":[25,114,170,200,258],"most":[27],"intuitive":[28],"approaches":[29],"interactive":[31],"music":[32,193,233],"creation.":[33],"However,":[34],"previous":[35],"studies":[36,58],"are":[37,261],"still":[38],"stagnating":[39],"in":[40,117],"limitations":[41],"regarding":[42],"usability":[43,136,240],"and":[44,52,72,78,93,109,137,202,231,241,251],"interpretability,":[45,250],"which":[46,195],"hinders":[47],"effective":[48],"interactions":[49],"between":[50],"AI.":[53],"For":[54],"thing,":[56],"these":[57,115,123],"entail":[59],"additional":[60],"complex":[61,148],"musical":[62,99,149,181],"conditions":[63],"as":[64,163,216,236,238],"auxiliary":[65],"inputs":[66,108,116],"(e.g.":[67],"chord":[68],"progressions,":[69],"contextual":[70],"melodies,":[71],"predetermined":[73],"rhythms),":[74],"supporting":[75],"only":[76,152],"fixed-length":[77],"rule-based":[79],"generation.":[81,120,210,224],"makes":[83],"existing":[84],"less":[86],"usable,":[87],"with":[88,134],"generated":[89],"lacking":[91],"diversity":[92],"coherence.":[94],"Moreover,":[95],"users":[96],"without":[97,180],"enough":[98],"expertise":[100],"might":[101],"find":[102],"it":[103],"difficult":[104],"define":[106],"appropriate":[107],"interpret":[111],"role":[113,169],"guiding":[118],"To":[121,183],"address":[122],"limitations,":[124],"we":[125,190],"present":[126],"Drawlody,":[127],"a":[128,153,213,239],"novel":[129],"sketch-based":[130],"system":[133,175,260],"enhanced":[135,248],"interpretability.":[138],"Specifically,":[139],"Drawlody":[140,225],"simplifies":[141],"user":[142,171],"input":[143],"requirements":[144],"excluding":[146],"all":[147],"conditions,":[150],"using":[151],"simplified":[154],"contour":[156],"representation":[157],"named":[158],"Generalised":[159],"Melody":[160],"Contour":[161],"(GMC)":[162],"input.":[164],"simplification":[166],"clarifies":[167],"controls,":[172],"making":[173],"more":[176],"usable":[177],"for":[178],"training.":[182],"guide":[184,208],"generation":[187,254],"from":[188],"GMC,":[189],"propose":[191],"FlexMIDI":[192],"representation,":[194],"simulates":[196],"tonal":[198],"structure":[199],"faithfully":[203],"explains":[204],"how":[205],"We":[211],"employ":[212],"CNN-Transformer-based":[214],"architecture":[215],"foundation":[218],"model":[219],"achieve":[221],"arbitrary-length":[222],"is":[226],"evaluated":[227],"both":[229],"objective":[230],"subjective":[232],"quality":[234],"studies,":[235],"well":[237],"interpretability":[242],"study.":[243],"The":[244],"results":[245],"support":[246],"its":[247],"usability,":[249],"high-quality":[252],"capabilities.":[255],"Video":[256],"demos":[257],"presented":[262],"<underline":[263],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[264],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">here</u>":[265],".":[266]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
