{"id":"https://openalex.org/W7117470416","doi":"https://doi.org/10.1109/dicta68720.2025.11302499","title":"Understanding Non-Verbal Vocalizations from Minimally-Verbal Autistic Individuals: A Transfer Learning Approach","display_name":"Understanding Non-Verbal Vocalizations from Minimally-Verbal Autistic Individuals: A Transfer Learning Approach","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7117470416","doi":"https://doi.org/10.1109/dicta68720.2025.11302499"},"language":null,"primary_location":{"id":"doi:10.1109/dicta68720.2025.11302499","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dicta68720.2025.11302499","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Digital Image Computing: Techniques and Applications (DICTA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025763022","display_name":"Anirudh Atmakuru","orcid":"https://orcid.org/0000-0003-1448-7334"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Anirudh Atmakuru","raw_affiliation_strings":["University of Massachusetts,Amherst,Massachusetts,USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts,Amherst,Massachusetts,USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120888494","display_name":"Pronab Sarker","orcid":null},"institutions":[{"id":"https://openalex.org/I29894533","display_name":"Charles Darwin University","ror":"https://ror.org/048zcaj52","country_code":"AU","type":"education","lineage":["https://openalex.org/I29894533"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Pronab Sarker","raw_affiliation_strings":["Charles Darwin University,Sydney,Australia"],"affiliations":[{"raw_affiliation_string":"Charles Darwin University,Sydney,Australia","institution_ids":["https://openalex.org/I29894533"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121502813","display_name":"Antu Chowdhury","orcid":null},"institutions":[{"id":"https://openalex.org/I29894533","display_name":"Charles Darwin University","ror":"https://ror.org/048zcaj52","country_code":"AU","type":"education","lineage":["https://openalex.org/I29894533"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Antu Chowdhury","raw_affiliation_strings":["Charles Darwin University,Sydney,Australia"],"affiliations":[{"raw_affiliation_string":"Charles Darwin University,Sydney,Australia","institution_ids":["https://openalex.org/I29894533"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121499431","display_name":"Prabal Dutta Barua","orcid":null},"institutions":[{"id":"https://openalex.org/I177920660","display_name":"Australian College of Physical Education","ror":"https://ror.org/04ze84192","country_code":"AU","type":"education","lineage":["https://openalex.org/I177920660"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Prabal Dutta Barua","raw_affiliation_strings":["Australian International Institute of Higher Education,Sydney,Australia"],"affiliations":[{"raw_affiliation_string":"Australian International Institute of Higher Education,Sydney,Australia","institution_ids":["https://openalex.org/I177920660"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121472030","display_name":"U Rajendra Acharya","orcid":null},"institutions":[{"id":"https://openalex.org/I185523456","display_name":"University of Southern Queensland","ror":"https://ror.org/04sjbnx57","country_code":"AU","type":"education","lineage":["https://openalex.org/I185523456"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"U Rajendra Acharya","raw_affiliation_strings":["University of Southern Queensland,Springfield,Australia"],"affiliations":[{"raw_affiliation_string":"University of Southern Queensland,Springfield,Australia","institution_ids":["https://openalex.org/I185523456"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121483637","display_name":"Abdul Hafeez-Baig","orcid":null},"institutions":[{"id":"https://openalex.org/I185523456","display_name":"University of Southern Queensland","ror":"https://ror.org/04sjbnx57","country_code":"AU","type":"education","lineage":["https://openalex.org/I185523456"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Abdul Hafeez-Baig","raw_affiliation_strings":["University of Southern Queensland,Toowoomba,Australia"],"affiliations":[{"raw_affiliation_string":"University of Southern Queensland,Toowoomba,Australia","institution_ids":["https://openalex.org/I185523456"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033894707","display_name":"Subrata Chakraborty","orcid":"https://orcid.org/0000-0002-0102-5424"},"institutions":[{"id":"https://openalex.org/I90745801","display_name":"University of New England","ror":"https://ror.org/04r659a56","country_code":"AU","type":"education","lineage":["https://openalex.org/I90745801"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Subrata Chakraborty","raw_affiliation_strings":["University of New England,Armidale,Australia"],"affiliations":[{"raw_affiliation_string":"University of New England,Armidale,Australia","institution_ids":["https://openalex.org/I90745801"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5025763022"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70756033,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10106","display_name":"Autism Spectrum Disorder Research","score":0.7213000059127808,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10106","display_name":"Autism Spectrum Disorder Research","score":0.7213000059127808,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11519","display_name":"Digital Mental Health Interventions","score":0.04650000110268593,"subfield":{"id":"https://openalex.org/subfields/3202","display_name":"Applied Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.041999999433755875,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.7394999861717224},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.6593000292778015},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.6349999904632568},{"id":"https://openalex.org/keywords/autism-spectrum-disorder","display_name":"Autism spectrum disorder","score":0.525600016117096},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4975000023841858},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.48989999294281006}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.7394999861717224},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.6593000292778015},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.6349999904632568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5360999703407288},{"id":"https://openalex.org/C2778538070","wikidata":"https://www.wikidata.org/wiki/Q1436063","display_name":"Autism spectrum disorder","level":3,"score":0.525600016117096},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5170999765396118},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4975000023841858},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.48989999294281006},{"id":"https://openalex.org/C205778803","wikidata":"https://www.wikidata.org/wiki/Q38404","display_name":"Autism","level":2,"score":0.47760000824928284},{"id":"https://openalex.org/C145633318","wikidata":"https://www.wikidata.org/wiki/Q207125","display_name":"Nonverbal communication","level":2,"score":0.46799999475479126},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4542999863624573},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4000999927520752},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.35929998755455017},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3398999869823456},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2712000012397766},{"id":"https://openalex.org/C102964294","wikidata":"https://www.wikidata.org/wiki/Q4820028","display_name":"Auditory learning","level":3,"score":0.26170000433921814},{"id":"https://openalex.org/C5570062","wikidata":"https://www.wikidata.org/wiki/Q3919817","display_name":"Behavioural sciences","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dicta68720.2025.11302499","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dicta68720.2025.11302499","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Digital Image Computing: Techniques and Applications (DICTA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8445329070091248}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1571453946","https://openalex.org/W2016433775","https://openalex.org/W2018368467","https://openalex.org/W2094274886","https://openalex.org/W2110063971","https://openalex.org/W2151305614","https://openalex.org/W2164571174","https://openalex.org/W2194775991","https://openalex.org/W2526050071","https://openalex.org/W2593451766","https://openalex.org/W2598909094","https://openalex.org/W2751841560","https://openalex.org/W2779286524","https://openalex.org/W2900299372","https://openalex.org/W2902092143","https://openalex.org/W2941027961","https://openalex.org/W2962845248","https://openalex.org/W2963163009","https://openalex.org/W2963446712","https://openalex.org/W3020824831","https://openalex.org/W3021253625","https://openalex.org/W3036030074","https://openalex.org/W3114304902","https://openalex.org/W3134122847","https://openalex.org/W3139253241","https://openalex.org/W3157722160","https://openalex.org/W3207601856","https://openalex.org/W4296558688","https://openalex.org/W4311900636","https://openalex.org/W4315436281","https://openalex.org/W4319978494","https://openalex.org/W4385607386","https://openalex.org/W4386918931","https://openalex.org/W4388593578","https://openalex.org/W4396753653","https://openalex.org/W4399096988"],"related_works":[],"abstract_inverted_index":{"Autism":[0],"Spectrum":[1],"Disorder":[2],"(ASD)":[3],"often":[4,20,35],"includes":[5],"challenges":[6],"in":[7,49,110,160,202],"verbal":[8,13],"communication,":[9],"particularly":[10,157],"for":[11,41,59,69,205],"minimally":[12],"(mv*)":[14],"individuals.":[15,208],"Mv*":[16],"individuals":[17,70,122],"with":[18,26,71,184],"ASD":[19,89,207],"find":[21],"it":[22,38,57],"difficult":[23,40],"to":[24,43,61,81,92,101,133],"communicate":[25],"people":[27,42],"since":[28],"their":[29,45],"vocalizations":[30,84,118,165],"are":[31],"highly":[32],"personalized":[33,67],"and":[34,52,65,78,95,105,136,142,155,174,195],"non-verbal,":[36],"making":[37],"extremely":[39],"understand":[44],"needs.":[46],"Recent":[47],"advances":[48],"machine":[50,192],"learning":[51,54,77,140,193],"deep":[53],"have":[55],"made":[56],"possible":[58],"researchers":[60],"explore":[62],"new":[63],"avenues":[64],"provide":[66],"care":[68,204],"ASD.":[72],"This":[73],"research":[74],"explores":[75],"transfer":[76,139],"Mel":[79,134],"spectrograms":[80,135],"classify":[82,164],"nonverbal":[83],"from":[85,119,124],"<tex":[86],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[87],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\text{mv}^{*}$</tex>":[88],"individuals,":[90],"aiming":[91],"improve":[93],"understanding":[94],"communication.":[96],"We":[97],"conduct":[98],"three":[99],"experiments":[100,150],"verify":[102],"the":[103,130,197],"robustness":[104],"generalizability":[106],"of":[107,116,188,199],"our":[108],"approach":[109],"different":[111],"setups.":[112],"Using":[113],"a":[114,143],"dataset":[115],"7077":[117],"eight":[120],"mv*":[121,206],"collected":[123],"noisy,":[125],"real-world":[126],"settings,":[127],"we":[128],"convert":[129],"audio":[131],"signals":[132],"evaluate":[137],"six":[138,167],"models":[141],"custom":[144],"convolutional":[145],"neural":[146],"network":[147],"model.":[148],"Our":[149],"demonstrated":[151],"that":[152,178],"DenseNet161,":[153],"ResNet101,":[154],"VGG19,":[156],"when":[158],"combined":[159],"an":[161,185],"ensemble,":[162],"effectively":[163],"into":[166],"categories:":[168],"self-talk,":[169],"frustration,":[170],"delight,":[171],"dysregulation,":[172],"social,":[173],"request.":[175],"Results":[176],"suggest":[177],"this":[179],"ensemble":[180],"achieves":[181],"state-of-the-art":[182],"performance":[183],"F1":[186],"score":[187],"0.79,":[189],"outperforming":[190],"traditional":[191],"methods":[194],"highlighting":[196],"potential":[198],"artificial":[200],"intelligence":[201],"enhancing":[203]},"counts_by_year":[],"updated_date":"2026-02-23T20:09:44.859080","created_date":"2025-12-29T00:00:00"}
