{"id":"https://openalex.org/W7131220386","doi":"https://doi.org/10.1007/s44163-026-00923-y","title":"Comprehensive evaluation of folk music teaching effects based on multimodal machine learning","display_name":"Comprehensive evaluation of folk music teaching effects based on multimodal machine learning","publication_year":2026,"publication_date":"2026-02-24","ids":{"openalex":"https://openalex.org/W7131220386","doi":"https://doi.org/10.1007/s44163-026-00923-y"},"language":"en","primary_location":{"id":"doi:10.1007/s44163-026-00923-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44163-026-00923-y","pdf_url":null,"source":{"id":"https://openalex.org/S4210220416","display_name":"Discover Artificial Intelligence","issn_l":"2731-0809","issn":["2731-0809"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Discover Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1007/s44163-026-00923-y","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126697905","display_name":"Aijuan Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I36152291","display_name":"Henan University of Technology","ror":"https://ror.org/05sbgwt55","country_code":"CN","type":"education","lineage":["https://openalex.org/I36152291"]},{"id":"https://openalex.org/I4210155994","display_name":"Zhengzhou Business University","ror":"https://ror.org/05azzk208","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210155994"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Aijuan Zhang","raw_affiliation_strings":["School of Art, Zhengzhou Technology and Business University, Zhengzhou, 451400, Henan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Art, Zhengzhou Technology and Business University, Zhengzhou, 451400, Henan, China","institution_ids":["https://openalex.org/I4210155994","https://openalex.org/I36152291"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5126697905"],"corresponding_institution_ids":["https://openalex.org/I36152291","https://openalex.org/I4210155994"],"apc_list":{"value":990,"currency":"EUR","value_usd":1067},"apc_paid":{"value":990,"currency":"EUR","value_usd":1067},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3829588,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"6","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11425","display_name":"Diverse Music Education Insights","score":0.7867000102996826,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11425","display_name":"Diverse Music Education Insights","score":0.7867000102996826,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.08169999718666077,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.03830000013113022,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.6814000010490417},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46230000257492065},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.460099995136261},{"id":"https://openalex.org/keywords/tone","display_name":"Tone (literature)","score":0.43070000410079956},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.35429999232292175},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.34880000352859497},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.3176000118255615},{"id":"https://openalex.org/keywords/curriculum","display_name":"Curriculum","score":0.3172999918460846}],"concepts":[{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.6814000010490417},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6527000069618225},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5044000148773193},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47119998931884766},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.460099995136261},{"id":"https://openalex.org/C2780583480","wikidata":"https://www.wikidata.org/wiki/Q1366327","display_name":"Tone (literature)","level":2,"score":0.43070000410079956},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.34880000352859497},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.3176000118255615},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.3172999918460846},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.30730000138282776},{"id":"https://openalex.org/C44819458","wikidata":"https://www.wikidata.org/wiki/Q27939","display_name":"Singing","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.29350000619888306},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28769999742507935},{"id":"https://openalex.org/C88610354","wikidata":"https://www.wikidata.org/wiki/Q1813494","display_name":"Teaching method","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.27880001068115234},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2759999930858612},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.27079999446868896},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.2597000002861023},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s44163-026-00923-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44163-026-00923-y","pdf_url":null,"source":{"id":"https://openalex.org/S4210220416","display_name":"Discover Artificial Intelligence","issn_l":"2731-0809","issn":["2731-0809"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Discover Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:889c90ee6d1e40a0bb32af05e5f58a86","is_oa":true,"landing_page_url":"https://doaj.org/article/889c90ee6d1e40a0bb32af05e5f58a86","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Discover Artificial Intelligence, Vol 6, Iss 1 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s44163-026-00923-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44163-026-00923-y","pdf_url":null,"source":{"id":"https://openalex.org/S4210220416","display_name":"Discover Artificial Intelligence","issn_l":"2731-0809","issn":["2731-0809"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Discover Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.6810252070426941,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W3151035074","https://openalex.org/W3176919888","https://openalex.org/W3193575540","https://openalex.org/W3196189239","https://openalex.org/W3216807142","https://openalex.org/W4220786059","https://openalex.org/W4220866988","https://openalex.org/W4225071736","https://openalex.org/W4285344186","https://openalex.org/W4290613406","https://openalex.org/W4293528120","https://openalex.org/W4320712896","https://openalex.org/W4327597030","https://openalex.org/W4385954199","https://openalex.org/W4387338546","https://openalex.org/W4388263840","https://openalex.org/W4403791324","https://openalex.org/W4403827087","https://openalex.org/W4404603408","https://openalex.org/W4404748858","https://openalex.org/W4409102241","https://openalex.org/W4411543855","https://openalex.org/W7083798832"],"related_works":[],"abstract_inverted_index":{"Folk":[0],"music":[1,73,112,174],"teaching":[2,144,175],"emphasizes":[3],"both":[4,162],"cultural":[5,193,204,230],"preservation":[6],"and":[7,35,56,72,77,94,107,126,145,165,192,203,232],"emotional":[8],"expression,":[9],"making":[10],"its":[11],"evaluation":[12,185,214],"complex.":[13],"Conventional":[14],"single-modality":[15],"methods,":[16],"relying":[17],"only":[18],"on":[19,170],"audio":[20,92],"or":[21],"textual":[22],"feedback,":[23],"often":[24],"fail":[25],"to":[26,59,122,139,156,236],"capture":[27,140],"the":[28],"interplay":[29],"between":[30],"performance":[31],"accuracy,":[32,210,223],"tonal":[33,83,109],"quality,":[34],"student":[36,166],"engagement.":[37],"To":[38],"overcome":[39],"these":[40,154],"limitations,":[41],"this":[42],"study":[43],"proposes":[44],"a":[45,61,171,196],"Hybrid":[46],"Multimodal":[47],"Sentiment-Tone":[48],"Analysis":[49],"(HMSTA)":[50],"framework":[51,65,199],"that":[52,104,181],"integrates":[53,153],"speech,":[54],"music,":[55],"gesture":[57,131,226],"analysis":[58],"provide":[60,157],"holistic":[62],"evaluation.":[63],"The":[64],"employs":[66],"wavelet":[67],"filtering":[68],"for":[69,81,99,200],"noise":[70],"reduction,":[71],"notes":[74,121],"are":[75,89,117],"normalized":[76],"categorized":[78],"into":[79],"types":[80],"consistent":[82],"representation.":[84],"Mel-Frequency":[85],"Cepstral":[86],"Coefficients":[87],"(MFCCs)":[88],"extracted":[90],"from":[91],"signals":[93],"serve":[95],"as":[96],"feature":[97],"inputs":[98],"Convolutional":[100],"Neural":[101],"Networks":[102],"(CNNs)":[103],"classify":[105],"emotions":[106],"analyze":[108],"patterns.":[110],"For":[111],"tone":[113],"evaluation,":[114],"MFCC-based":[115],"features":[116,155],"compared":[118],"against":[119],"reference":[120],"assess":[123],"pitch":[124,190,222],"accuracy":[125,186],"rhythm":[127],"stability.":[128],"In":[129],"parallel,":[130],"engagement":[132],"is":[133],"measured":[134],"using":[135],"CNN-based":[136],"pose":[137],"estimation":[138],"expressive":[141],"movement":[142],"during":[143],"learning":[146],"sessions.":[147],"A":[148],"multimodal":[149,172],"attention-based":[150],"fusion":[151],"model":[152],"synchronized,":[158],"real-time":[159],"assessments":[160],"of":[161,177],"teacher":[163],"delivery":[164],"response.":[167],"Experimental":[168],"validation":[169],"folk":[173],"dataset":[176],"200":[178],"sessions":[179],"demonstrates":[180,208],"HMSTA":[182,207],"achieves":[183],"high":[184],"across":[187],"emotion":[188,218],"recognition,":[189,219],"analysis,":[191,227],"authenticity,":[194,231],"offering":[195],"practical,":[197],"data-driven":[198],"curriculum":[201],"improvement":[202],"heritage":[205],"preservation.":[206],"superior":[209],"averaging":[211],"91.7%":[212],"in":[213,217,221,225,229],"scores,":[215],"89.4%":[216],"93.1%":[220],"90.6%":[224],"91.2%":[228],"reducing":[233],"processing":[234],"time":[235],"10.2":[237],"s":[238],"per":[239],"session.":[240]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2026-02-25T00:00:00"}
