{"id":"https://openalex.org/W2100809072","doi":"https://doi.org/10.1145/2072298.2071949","title":"Document dependent fusion in multimodal music retrieval","display_name":"Document dependent fusion in multimodal music retrieval","publication_year":2011,"publication_date":"2011-11-28","ids":{"openalex":"https://openalex.org/W2100809072","doi":"https://doi.org/10.1145/2072298.2071949","mag":"2100809072"},"language":"en","primary_location":{"id":"doi:10.1145/2072298.2071949","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2072298.2071949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th ACM international conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115666591","display_name":"Zhonghua Li","orcid":"https://orcid.org/0000-0002-6378-045X"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Zhonghua Li","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101423194","display_name":"Bingjun Zhang","orcid":"https://orcid.org/0000-0002-6149-7095"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Bingjun Zhang","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100423435","display_name":"Ye Wang","orcid":"https://orcid.org/0000-0002-0123-1260"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ye Wang","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5115666591"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.312,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.56705056,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1105","last_page":"1108"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7418701648712158},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.7243615984916687},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6048092842102051},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4881013333797455},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4637181758880615},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4398385286331177},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36633533239364624},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36402833461761475}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7418701648712158},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.7243615984916687},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6048092842102051},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4881013333797455},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4637181758880615},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4398385286331177},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36633533239364624},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36402833461761475},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/2072298.2071949","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2072298.2071949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th ACM international conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:scholarbank.nus.edu.sg:10635/41360","is_oa":false,"landing_page_url":"http://scholarbank.nus.edu.sg/handle/10635/41360","pdf_url":null,"source":{"id":"https://openalex.org/S7407052290","display_name":"National University of Singapore","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scopus","raw_type":"Conference Paper"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.689.9835","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.689.9835","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.comp.nus.edu.sg/%7Ewangye/papers/1.Audio_and_Music_Analysis_and_Retrieval/2011_Document_Dependent_Fusion_in_Multimodal_Music_Retrieval.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321026","display_name":"Ministry of Earth Sciences","ror":"https://ror.org/013cf5k59"},{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1482214997","https://openalex.org/W1992778361","https://openalex.org/W2031602671","https://openalex.org/W2033485987","https://openalex.org/W2078396654","https://openalex.org/W2090561883","https://openalex.org/W2098162425","https://openalex.org/W2157059464","https://openalex.org/W2184848982","https://openalex.org/W6674809819"],"related_works":["https://openalex.org/W2185469136","https://openalex.org/W2011264131","https://openalex.org/W4306353150","https://openalex.org/W2026860389","https://openalex.org/W8219677","https://openalex.org/W2132659060","https://openalex.org/W2031992971","https://openalex.org/W3214791684","https://openalex.org/W2353265673","https://openalex.org/W2152662039"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,31],"propose":[4],"a":[5,33,65,73,79],"novel":[6],"multimodal":[7,60],"fusion":[8,12,26,61,92,96,119],"framework,":[9],"document":[10,23,34,47,71],"dependent":[11,95],"(DDF),":[13],"which":[14],"derives":[15],"the":[16,25,39,85,114],"optimal":[17],"combination":[18,67],"strategy":[19,68],"for":[20,69],"each":[21,29,70],"individual":[22],"in":[24],"process.":[27],"For":[28],"document,":[30],"derive":[32],"weight":[35,48],"vector":[36,49],"by":[37],"estimating":[38],"descriptive":[40],"abilities":[41],"of":[42,88,117],"its":[43],"different":[44],"modalities.":[45],"The":[46],"also":[50],"enables":[51],"our":[52],"framework":[53],"to":[54,83],"be":[55],"easily":[56],"integrated":[57],"with":[58,104],"existing":[59],"schemes,":[62],"and":[63,93,98],"achieve":[64],"better":[66],"given":[72],"query.":[74],"Experiments":[75],"are":[76],"conducted":[77],"on":[78],"17174-song":[80],"music":[81],"database":[82],"compare":[84],"retrieval":[86,115],"accuracy":[87],"traditional":[89],"query":[90,94],"independent":[91],"approaches,":[97],"that":[99,109],"obtained":[100],"after":[101],"integrating":[102],"DDF":[103,110],"them.":[105],"Experimental":[106],"results":[107],"indicate":[108],"can":[111],"significantly":[112],"improve":[113],"performance":[116],"current":[118],"approaches.":[120]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
