{"id":"https://openalex.org/W4403060978","doi":"https://doi.org/10.1109/iotaai62601.2024.10692931","title":"A multi-scale convolutional attention neural network based on residual block downsampling for infant cry classification and detection","display_name":"A multi-scale convolutional attention neural network based on residual block downsampling for infant cry classification and detection","publication_year":2024,"publication_date":"2024-07-26","ids":{"openalex":"https://openalex.org/W4403060978","doi":"https://doi.org/10.1109/iotaai62601.2024.10692931"},"language":"en","primary_location":{"id":"doi:10.1109/iotaai62601.2024.10692931","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iotaai62601.2024.10692931","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 6th International Conference on Internet of Things, Automation and Artificial Intelligence (IoTAAI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101891276","display_name":"Junjie Yang","orcid":"https://orcid.org/0000-0001-9257-8800"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junjie Yang","raw_affiliation_strings":["Guangdong University of Technology,Automation School,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology,Automation School,Guangzhou,China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100389521","display_name":"Zhenyu Zhang","orcid":"https://orcid.org/0000-0002-2309-3145"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"ZhenYu Zhang","raw_affiliation_strings":["Guangdong University of Technology,Automation School,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology,Automation School,Guangzhou,China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068405483","display_name":"Jin Li","orcid":"https://orcid.org/0000-0002-1564-8163"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Li","raw_affiliation_strings":["Guangdong University of Technology,Automation School,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology,Automation School,Guangzhou,China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100707569","display_name":"Chen Lin","orcid":"https://orcid.org/0000-0002-2275-997X"},"institutions":[{"id":"https://openalex.org/I6507939","display_name":"China United Network Communications Group (China)","ror":"https://ror.org/028w99c90","country_code":"CN","type":"company","lineage":["https://openalex.org/I6507939"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Lin","raw_affiliation_strings":["Unicom (Guangdong) Industrial Internet Corporation,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Unicom (Guangdong) Industrial Internet Corporation,Guangzhou,China","institution_ids":["https://openalex.org/I6507939"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101891276"],"corresponding_institution_ids":["https://openalex.org/I139024713"],"apc_list":null,"apc_paid":null,"fwci":2.3378,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.88925422,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"9","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13289","display_name":"Infant Health and Development","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3611","display_name":"Pharmacy"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T13289","display_name":"Infant Health and Development","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3611","display_name":"Pharmacy"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7369644641876221},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6828771829605103},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.6812425851821899},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5980198979377747},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5508414506912231},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5340529680252075},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43857550621032715},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4257637858390808},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09282433986663818},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.08370453119277954},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.04774734377861023}],"concepts":[{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7369644641876221},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6828771829605103},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.6812425851821899},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5980198979377747},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5508414506912231},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5340529680252075},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43857550621032715},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4257637858390808},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09282433986663818},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.08370453119277954},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.04774734377861023},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iotaai62601.2024.10692931","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iotaai62601.2024.10692931","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 6th International Conference on Internet of Things, Automation and Artificial Intelligence (IoTAAI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/2","display_name":"Zero hunger","score":0.6600000262260437}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2752782242","https://openalex.org/W2760129417","https://openalex.org/W3004557276","https://openalex.org/W3006087478","https://openalex.org/W3011513287","https://openalex.org/W3155168159","https://openalex.org/W3203149322","https://openalex.org/W3208211487","https://openalex.org/W4309627742","https://openalex.org/W4327782440","https://openalex.org/W4385871928"],"related_works":["https://openalex.org/W2062399876","https://openalex.org/W2607795551","https://openalex.org/W3155117723","https://openalex.org/W1991429770","https://openalex.org/W1983892167","https://openalex.org/W2281134365","https://openalex.org/W4310746709","https://openalex.org/W4385574037","https://openalex.org/W4386075645","https://openalex.org/W4306309518"],"abstract_inverted_index":{"The":[0,32,92,138,154,166],"cries":[1],"of":[2,34,56,96,140,160,169,181],"infants":[3],"contain":[4],"rich":[5],"information,":[6,128],"indicating":[7],"hunger,":[8],"tiredness,":[9],"discomfort,":[10],"and":[11,28,48,54,113,129,143,206],"other":[12,188],"physical":[13],"discomforts.":[14],"If":[15],"we":[16,22],"can":[17,23],"understand":[18],"a":[19,39,78,83,99,178],"baby's":[20],"cry,":[21],"quickly":[24],"assess":[25],"their":[26],"state":[27],"take":[29],"appropriate":[30],"action.":[31],"classification":[33,65,69,79],"infant":[35,57],"cry":[36,58],"sounds":[37],"plays":[38],"crucial":[40],"role":[41],"in":[42],"areas":[43],"such":[44],"as":[45],"household":[46],"prompts":[47],"medical":[49],"examinations.":[50],"However,":[51],"the":[52,123,152,170,193,197,203],"diversity":[53],"complexity":[55],"categories":[59],"present":[60],"significant":[61],"challenges":[62],"for":[63],"deep":[64,190],"design.":[66],"To":[67],"improve":[68],"accuracy":[70,159,199],"while":[71,200],"conserving":[72],"computational":[73,179,207],"resources,":[74],"this":[75],"study":[76],"proposes":[77],"method":[80],"based":[81,109],"on":[82,110,162],"multi-scale":[84,114,141],"convolutional":[85],"attention":[86,104,144],"neural":[87],"network":[88],"with":[89,177],"residual":[90,106,111],"downsampling.":[91],"proposed":[93,155,171,194],"model":[94,156,167,195],"consists":[95],"four":[97],"parts:":[98],"feature":[100,127,136],"extraction":[101],"module,":[102,105],"SE":[103],"downsampling":[107,130],"module":[108],"networks,":[112],"convolution":[115,142],"module.":[116],"Mel":[117],"spectrogram":[118],"transformation":[119],"is":[120,131,145],"applied":[121],"to":[122,125,133,147,174,187],"audio":[124],"extract":[126,148],"performed":[132],"obtain":[134],"richer":[135],"representations.":[137],"combination":[139],"used":[146],"key":[149],"information":[150],"from":[151],"features.":[153],"achieves":[157,196],"an":[158],"86.29%":[161],"publicly":[163],"available":[164],"datasets.":[165],"parameters":[168],"algorithm":[172],"amount":[173],"6.67":[175],"million,":[176],"cost":[180,208],"0.66G":[182],"FLOPs":[183],"per":[184],"second.":[185],"Compared":[186],"existing":[189],"learning":[191],"algorithms,":[192],"highest":[198],"considering":[201],"both":[202],"parameter":[204],"quantity":[205],"simultaneously.":[209]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
