{"id":"https://openalex.org/W2752816251","doi":"https://doi.org/10.1109/icme.2017.8019341","title":"Automatic music mood classification by learning cross-media relevance between audio and lyrics","display_name":"Automatic music mood classification by learning cross-media relevance between audio and lyrics","publication_year":2017,"publication_date":"2017-07-01","ids":{"openalex":"https://openalex.org/W2752816251","doi":"https://doi.org/10.1109/icme.2017.8019341","mag":"2752816251"},"language":"en","primary_location":{"id":"doi:10.1109/icme.2017.8019341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme.2017.8019341","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070277096","display_name":"Yu Xiong","orcid":"https://orcid.org/0000-0001-7170-6201"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yu Xiong","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006378862","display_name":"Feng Su","orcid":"https://orcid.org/0000-0002-8426-9634"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Su","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100417789","display_name":"Qianqian Wang","orcid":"https://orcid.org/0000-0002-7839-9707"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianqian Wang","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5070277096"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.5548,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.65562685,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"961","last_page":"966"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lyrics","display_name":"Lyrics","score":0.8454740047454834},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6749857068061829},{"id":"https://openalex.org/keywords/mood","display_name":"Mood","score":0.5965878367424011},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5691261887550354},{"id":"https://openalex.org/keywords/music-information-retrieval","display_name":"Music information retrieval","score":0.5664059519767761},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5487037301063538},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5437267422676086},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.48620742559432983},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4504568874835968},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.42179346084594727},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4207437038421631},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.21848708391189575},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.11382690072059631}],"concepts":[{"id":"https://openalex.org/C2776436406","wikidata":"https://www.wikidata.org/wiki/Q602446","display_name":"Lyrics","level":2,"score":0.8454740047454834},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6749857068061829},{"id":"https://openalex.org/C2780733359","wikidata":"https://www.wikidata.org/wiki/Q331769","display_name":"Mood","level":2,"score":0.5965878367424011},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5691261887550354},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.5664059519767761},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5487037301063538},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5437267422676086},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.48620742559432983},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4504568874835968},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.42179346084594727},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4207437038421631},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.21848708391189575},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.11382690072059631},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme.2017.8019341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme.2017.8019341","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W78455842","https://openalex.org/W168039245","https://openalex.org/W1488833649","https://openalex.org/W1566337733","https://openalex.org/W1983507146","https://openalex.org/W2070154071","https://openalex.org/W2081580037","https://openalex.org/W2087104069","https://openalex.org/W2104252248","https://openalex.org/W2107430826","https://openalex.org/W2137918516","https://openalex.org/W2144707026","https://openalex.org/W2148600927","https://openalex.org/W2149628368","https://openalex.org/W2238417843","https://openalex.org/W2250539671","https://openalex.org/W2283195891","https://openalex.org/W6606829919","https://openalex.org/W6689708489"],"related_works":["https://openalex.org/W2987280934","https://openalex.org/W2751624083","https://openalex.org/W4241564561","https://openalex.org/W2994064478","https://openalex.org/W2144707026","https://openalex.org/W112239495","https://openalex.org/W2542820473","https://openalex.org/W2515398186","https://openalex.org/W2130068930","https://openalex.org/W2012665501"],"abstract_inverted_index":{"Automatic":[0],"analysis":[1],"of":[2,5,8,11,27,51,54,60,74,96,112,119,133,136,145],"the":[3,49,61,64,68,71,82,88,102,109,125,143,146],"mood":[4,34,50,126],"a":[6,32,42,52,93],"piece":[7,53,118],"music":[9,15,55,89,115,120,137],"is":[10,121],"great":[12],"value":[13],"in":[14,37,87],"searching,":[16],"understanding,":[17],"recommendation":[18],"and":[19,70,84],"some":[20],"other":[21],"music-related":[22],"applications.":[23],"Different":[24],"from":[25],"most":[26],"previous":[28],"methods":[29],"that":[30,106,128],"adopted":[31],"discriminative":[33],"classification":[35],"scheme,":[36],"this":[38,130],"paper,":[39],"we":[40],"propose":[41],"generative":[43],"multimodal":[44,103],"method":[45],"for":[46,80],"automatically":[47],"classifying":[48],"based":[56],"on":[57],"effective":[58,78],"learning":[59],"relevance":[62],"(i.e.":[63],"joint":[65,104,131],"distribution)":[66],"between":[67],"audio":[69],"lyrics":[72,97],"modalities":[73,135],"music.":[75],"We":[76],"present":[77],"algorithms":[79],"computing":[81],"word-to-audio":[83],"word-to-word":[85],"relations":[86],"as":[90,92],"well":[91],"priori":[94],"probability":[95,132],"words,":[98],"which":[99],"altogether":[100],"form":[101],"distribution":[105],"distinctively":[107],"captures":[108],"intrinsic":[110],"characteristic":[111],"one":[113],"specific":[114],"mood.":[116],"A":[117],"then":[122],"classified":[123],"to":[124],"category":[127],"maximizes":[129],"different":[134],"data.":[138],"The":[139],"experiment":[140],"results":[141],"demonstrated":[142],"effectiveness":[144],"proposed":[147],"method.":[148]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2018,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
