{"id":"https://openalex.org/W7147552213","doi":"https://doi.org/10.1109/cnml68938.2026.11453256","title":"Adaptive Efficacy Assessment Method for Music Education via Multimodal Deep Learning Fusion","display_name":"Adaptive Efficacy Assessment Method for Music Education via Multimodal Deep Learning Fusion","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7147552213","doi":"https://doi.org/10.1109/cnml68938.2026.11453256"},"language":null,"primary_location":{"id":"doi:10.1109/cnml68938.2026.11453256","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11453256","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132703105","display_name":"Wenxiu Li","orcid":null},"institutions":[{"id":"https://openalex.org/I4210089766","display_name":"Technical and Vocational University","ror":"https://ror.org/00854zy02","country_code":"IR","type":"education","lineage":["https://openalex.org/I4210089766"]}],"countries":["IR"],"is_corresponding":true,"raw_author_name":"Wenxiu Li","raw_affiliation_strings":["Laiwu Vocational and Technical College,Shandong,China"],"affiliations":[{"raw_affiliation_string":"Laiwu Vocational and Technical College,Shandong,China","institution_ids":["https://openalex.org/I4210089766"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5132703105"],"corresponding_institution_ids":["https://openalex.org/I4210089766"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.95209581,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1284","last_page":"1290"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11425","display_name":"Diverse Music Education Insights","score":0.33959999680519104,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11425","display_name":"Diverse Music Education Insights","score":0.33959999680519104,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.20340000092983246,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.08470000326633453,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6665999889373779},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6028000116348267},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.47269999980926514},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.41029998660087585},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4018000066280365},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.35589998960494995},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.34119999408721924},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.32850000262260437},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.31150001287460327}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8064000010490417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6674000024795532},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6665999889373779},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6028000116348267},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5060999989509583},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.47269999980926514},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.41029998660087585},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4018000066280365},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.35589998960494995},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.34119999408721924},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.32850000262260437},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.31150001287460327},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3061000108718872},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.30480000376701355},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.30149999260902405},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.2840000092983246},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.28220000863075256},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.27709999680519104},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.257099986076355},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2554999887943268},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.2538999915122986},{"id":"https://openalex.org/C171836373","wikidata":"https://www.wikidata.org/wiki/Q2266329","display_name":"Linear interpolation","level":3,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cnml68938.2026.11453256","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11453256","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8375023603439331,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W3085812513","https://openalex.org/W4292457823","https://openalex.org/W4295647263","https://openalex.org/W4388263840","https://openalex.org/W4391319721","https://openalex.org/W4403827087","https://openalex.org/W4404603408","https://openalex.org/W4404748858","https://openalex.org/W4409102241","https://openalex.org/W4411992312","https://openalex.org/W7119473516"],"related_works":[],"abstract_inverted_index":{"Addressing":[0],"the":[1,14,47,61,93,126,144,172,183],"limitations":[2],"inherent":[3],"in":[4,98],"traditional":[5],"music":[6],"education":[7],"assessment\u2014specifically":[8],"strong":[9],"subjectivity,":[10],"delayed":[11],"feedback,":[12],"and":[13,108,129,175],"loss":[15],"of":[16,95,188],"technical":[17],"details":[18],"due":[19],"to":[20,54,75,85,91,114,156],"single-modality":[21],"information\u2014this":[22],"paper":[23],"proposes":[24],"a":[25,81,103,130],"novel":[26],"Adaptive":[27,110],"Efficacy":[28],"Assessment":[29],"Method":[30],"(MAAF)":[31],"based":[32,124],"on":[33,125,165],"multimodal":[34],"deep":[35],"learning":[36],"fusion.":[37],"The":[38,179],"method":[39],"constructs":[40],"an":[41,51,109,148],"audio-visual":[42,120],"dual-stream":[43],"neural":[44],"network":[45],"architecture:":[46],"auditory":[48],"channel":[49,63],"utilizes":[50],"improved":[52],"ResNet":[53],"extract":[55],"high-dimensional":[56],"acoustic":[57],"features":[58],"from":[59],"Mel-spectrograms;":[60],"visual":[62],"integrates":[64],"OpenPose":[65],"hand":[66],"keypoint":[67],"detection":[68],"with":[69],"Spatio-Temporal":[70],"Graph":[71],"Convolutional":[72],"Networks":[73],"(ST-GCN)":[74],"capture":[76],"fine-grained":[77],"performance":[78],"techniques,":[79],"employing":[80],"confidence-based":[82],"masking":[83],"strategy":[84,107],"effectively":[86,181],"suppress":[87],"occlusion":[88],"noise.":[89],"Furthermore,":[90,162],"address":[92],"challenge":[94],"spatiotemporal":[96],"asynchrony":[97],"heterogeneous":[99,166],"data,":[100],"we":[101],"design":[102],"linear":[104],"interpolation":[105],"alignment":[106],"Gated":[111],"Attention":[112],"Mechanism":[113],"realize":[115],"dynamic":[116],"weight":[117],"allocation":[118],"for":[119],"features.":[121],"Empirical":[122],"research":[123],"URMP":[127],"dataset":[128],"newly":[131],"constructed":[132],"Real-World":[133],"Classroom":[134],"Dataset":[135],"(RWCD),":[136],"validated":[137],"by":[138],"expert":[139],"reliability":[140],"tests,":[141],"demonstrates":[142],"that":[143,152],"proposed":[145],"model":[146,180],"achieves":[147],"assessment":[149,186],"accuracy":[150],"(PCC=0.898)":[151],"is":[153],"significantly":[154],"superior":[155],"mainstream":[157],"SOTA":[158],"architectures":[159],"(e.g.,":[160,168],"Transformers).":[161],"extensive":[163],"experiments":[164],"instruments":[167],"Piano,":[169],"Guitar)":[170],"confirm":[171],"model's":[173],"robustness":[174],"cross-domain":[176],"generalization":[177],"capabilities.":[178],"simulates":[182],"multi-sensory":[184],"collaborative":[185],"logic":[187],"human":[189],"experts.":[190]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
