{"id":"https://openalex.org/W4206364333","doi":"https://doi.org/10.1109/icct52962.2021.9658086","title":"Acoustic Scene Classification Using Aggregation of Two-Scale Deep Embeddings","display_name":"Acoustic Scene Classification Using Aggregation of Two-Scale Deep Embeddings","publication_year":2021,"publication_date":"2021-10-13","ids":{"openalex":"https://openalex.org/W4206364333","doi":"https://doi.org/10.1109/icct52962.2021.9658086"},"language":"en","primary_location":{"id":"doi:10.1109/icct52962.2021.9658086","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icct52962.2021.9658086","pdf_url":null,"source":{"id":"https://openalex.org/S4363607878","display_name":"2021 IEEE 21st International Conference on Communication Technology (ICCT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 21st International Conference on Communication Technology (ICCT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002402546","display_name":"Ho Ka Chon","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ho Ka Chon","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070863631","display_name":"Yanxiong Li","orcid":"https://orcid.org/0000-0003-4362-1125"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanxiong Li","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055239917","display_name":"Wenchang Cao","orcid":"https://orcid.org/0009-0008-2790-2983"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenchang Cao","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074527802","display_name":"Qisheng Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qisheng Huang","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101525745","display_name":"Wei Xie","orcid":"https://orcid.org/0000-0003-1770-8710"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Xie","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011018489","display_name":"Wenfeng Pang","orcid":"https://orcid.org/0000-0002-9443-7208"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenfeng Pang","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101963530","display_name":"Jiyue Wang","orcid":"https://orcid.org/0000-0002-2779-5355"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiyue Wang","raw_affiliation_strings":["School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5002402546"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":0.5161,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.67830759,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"23","issue":null,"first_page":"1341","last_page":"1345"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9829999804496765,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7385963201522827},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7113496661186218},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7030045986175537},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6302127838134766},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6082216501235962},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5286638736724854},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.5114473104476929},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.45279961824417114},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4207113981246948},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1116953194141388},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.10456022620201111},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08338943123817444}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7385963201522827},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7113496661186218},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7030045986175537},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6302127838134766},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6082216501235962},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5286638736724854},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.5114473104476929},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.45279961824417114},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4207113981246948},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1116953194141388},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.10456022620201111},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08338943123817444},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icct52962.2021.9658086","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icct52962.2021.9658086","pdf_url":null,"source":{"id":"https://openalex.org/S4363607878","display_name":"2021 IEEE 21st International Conference on Communication Technology (ICCT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 21st International Conference on Communication Technology (ICCT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4006312882","display_name":null,"funder_award_id":"61771200,62111530145","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7284265120","display_name":null,"funder_award_id":"2021A1515011454","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G7598593291","display_name":null,"funder_award_id":"2021A0505030003","funder_id":"https://openalex.org/F4320335795","funder_display_name":"Science and Technology Planning Project of Guangdong Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335795","display_name":"Science and Technology Planning Project of Guangdong Province","ror":null},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W2086384421","https://openalex.org/W2105068979","https://openalex.org/W2128437937","https://openalex.org/W2511956680","https://openalex.org/W2571520038","https://openalex.org/W2617002574","https://openalex.org/W2619623002","https://openalex.org/W2775505379","https://openalex.org/W2775794021","https://openalex.org/W2799400564","https://openalex.org/W2820243394","https://openalex.org/W2890718983","https://openalex.org/W2895776009","https://openalex.org/W2902772991","https://openalex.org/W2907743838","https://openalex.org/W2912899030","https://openalex.org/W2937299048","https://openalex.org/W2960236182","https://openalex.org/W2962711843","https://openalex.org/W2980689481","https://openalex.org/W2997084465","https://openalex.org/W3005258917","https://openalex.org/W3012504141","https://openalex.org/W3015530480","https://openalex.org/W3015594652","https://openalex.org/W3015855451","https://openalex.org/W3016227692","https://openalex.org/W3034892239","https://openalex.org/W3041618382","https://openalex.org/W3080193477","https://openalex.org/W3090499079","https://openalex.org/W3160061063","https://openalex.org/W4238186852","https://openalex.org/W4298091485","https://openalex.org/W6747331233","https://openalex.org/W6779341498","https://openalex.org/W6819339640"],"related_works":["https://openalex.org/W3133861977","https://openalex.org/W2731899572","https://openalex.org/W4200173597","https://openalex.org/W3116150086","https://openalex.org/W2999805992","https://openalex.org/W4283589925","https://openalex.org/W3156786002","https://openalex.org/W2738221750","https://openalex.org/W2732542196","https://openalex.org/W3186111093"],"abstract_inverted_index":{"Acoustic":[0,105],"scene":[1,31],"classification":[2,142],"(ASC)":[3],"is":[4,17,159],"a":[5,25,30],"topic":[6],"related":[7],"to":[8,18,154],"the":[9,36,50,57,64,98,118,122,129,132,139,155],"field":[10,65],"of":[11,35,52,59,66,97,104,124,131,141],"machine":[12],"listening":[13],"whose":[14],"important":[15],"role":[16],"recognize":[19],"and":[20,43,102,107,112,146,150],"categorize":[21],"audio":[22],"data":[23],"in":[24,63],"predefined":[26],"label":[27],"which":[28],"describes":[29],"location.":[32],"In":[33],"most":[34],"state-of-the-art":[37],"works":[38],"for":[39],"ASC,":[40],"hand-crafted":[41],"features":[42],"single-scale":[44],"deep":[45,61,77,126],"embeddings":[46,62,78,127],"were":[47],"adopted":[48],"as":[49],"input":[51],"back-end":[53],"classifiers.":[54],"Inspired":[55],"by":[56,74,83,144],"success":[58],"multi-scale":[60],"computer":[67],"vision,":[68],"we":[69],"propose":[70],"an":[71],"ASC":[72,91,133],"method":[73,120,137],"aggregating":[75],"two-scale":[76,125],"that":[79,117],"are":[80],"independently":[81],"learned":[82],"two":[84,94],"convolutional":[85],"neural":[86],"networks":[87],"(CNNs).":[88],"We":[89],"perform":[90],"experiments":[92],"on":[93,100,148],"official":[95],"datasets":[96],"challenge":[99],"Detection":[101],"Classification":[103],"Scenes":[106],"Events":[108],"(DCASE),":[109],"i.e.,":[110],"DCASE-2019":[111,149],"DCASE-2017.":[113],"Experimental":[114],"results":[115],"show":[116],"proposed":[119,136],"using":[121],"aggregation":[123],"improves":[128],"performance":[130],"system.":[134,157],"The":[135],"obtains":[138],"improvement":[140],"accuracies":[143],"0.11":[145],"0.09":[147],"DCASE-2017":[151],"respectively":[152],"compared":[153],"baseline":[156],"Code":[158],"available:":[160],"https://github.com/hokachon/Two-scale-Agg.":[161]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
