{"id":"https://openalex.org/W1708979102","doi":"https://doi.org/10.1109/cit.2004.1357184","title":"Environmental sound recognition by multilayered neural networks","display_name":"Environmental sound recognition by multilayered neural networks","publication_year":2004,"publication_date":"2004-12-23","ids":{"openalex":"https://openalex.org/W1708979102","doi":"https://doi.org/10.1109/cit.2004.1357184","mag":"1708979102"},"language":"en","primary_location":{"id":"doi:10.1109/cit.2004.1357184","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cit.2004.1357184","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Fourth International Conference onComputer and Information Technology, 2004. CIT '04.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067353501","display_name":"Yoshiyuki Toyoda","orcid":null},"institutions":[{"id":"https://openalex.org/I141591182","display_name":"University of Aizu","ror":"https://ror.org/02pg0e883","country_code":"JP","type":"education","lineage":["https://openalex.org/I141591182"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Y. Toyoda","raw_affiliation_strings":["Dept. of Inf. Syst., Aizu Univ., Japan"],"affiliations":[{"raw_affiliation_string":"Dept. of Inf. Syst., Aizu Univ., Japan","institution_ids":["https://openalex.org/I141591182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033737940","display_name":"Jie Huang","orcid":"https://orcid.org/0000-0002-3518-3404"},"institutions":[{"id":"https://openalex.org/I141591182","display_name":"University of Aizu","ror":"https://ror.org/02pg0e883","country_code":"JP","type":"education","lineage":["https://openalex.org/I141591182"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jie Huang","raw_affiliation_strings":["School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","School of Computer Science and Engineering, The University of Aizu"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","institution_ids":["https://openalex.org/I141591182"]},{"raw_affiliation_string":"School of Computer Science and Engineering, The University of Aizu","institution_ids":["https://openalex.org/I141591182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009582696","display_name":"Shuxue Ding","orcid":"https://orcid.org/0000-0002-4963-3883"},"institutions":[{"id":"https://openalex.org/I141591182","display_name":"University of Aizu","ror":"https://ror.org/02pg0e883","country_code":"JP","type":"education","lineage":["https://openalex.org/I141591182"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shuxue Ding","raw_affiliation_strings":["School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","School of Computer Science and Engineering, The University of Aizu"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","institution_ids":["https://openalex.org/I141591182"]},{"raw_affiliation_string":"School of Computer Science and Engineering, The University of Aizu","institution_ids":["https://openalex.org/I141591182"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014714438","display_name":"Yong Liu","orcid":"https://orcid.org/0000-0003-3314-1750"},"institutions":[{"id":"https://openalex.org/I141591182","display_name":"University of Aizu","ror":"https://ror.org/02pg0e883","country_code":"JP","type":"education","lineage":["https://openalex.org/I141591182"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yong Liu","raw_affiliation_strings":["School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","School of Computer Science and Engineering, The University of Aizu"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Egineering, Department of Informations Systems, University of Aizuwakamatsu, Japan","institution_ids":["https://openalex.org/I141591182"]},{"raw_affiliation_string":"School of Computer Science and Engineering, The University of Aizu","institution_ids":["https://openalex.org/I141591182"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5067353501"],"corresponding_institution_ids":["https://openalex.org/I141591182"],"apc_list":null,"apc_paid":null,"fwci":1.1428,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.77679131,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"123","last_page":"127"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10822","display_name":"Acoustic Wave Phenomena Research","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7296712398529053},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5878511071205139},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5560893416404724},{"id":"https://openalex.org/keywords/environmental-noise","display_name":"Environmental noise","score":0.5004894733428955},{"id":"https://openalex.org/keywords/multilayer-perceptron","display_name":"Multilayer perceptron","score":0.49796533584594727},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.44511330127716064},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4264912009239197},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.41149812936782837},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.40839865803718567},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36612948775291443},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.34971773624420166},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.20834484696388245}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7296712398529053},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5878511071205139},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5560893416404724},{"id":"https://openalex.org/C86781634","wikidata":"https://www.wikidata.org/wiki/Q2478325","display_name":"Environmental noise","level":3,"score":0.5004894733428955},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.49796533584594727},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.44511330127716064},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4264912009239197},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41149812936782837},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.40839865803718567},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36612948775291443},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.34971773624420166},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.20834484696388245},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cit.2004.1357184","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cit.2004.1357184","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Fourth International Conference onComputer and Information Technology, 2004. CIT '04.","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land","score":0.47999998927116394}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W1982466904","https://openalex.org/W2048060899","https://openalex.org/W2058341666"],"related_works":["https://openalex.org/W2364370872","https://openalex.org/W2053269318","https://openalex.org/W2025614924","https://openalex.org/W2294335174","https://openalex.org/W2097963413","https://openalex.org/W3145575561","https://openalex.org/W2001275470","https://openalex.org/W2073996508","https://openalex.org/W1591475660","https://openalex.org/W2164162849"],"abstract_inverted_index":{"Environmental":[0,41],"sound":[1,21,42,61,90,172],"recognition":[2,43,62,167],"is":[3,27,95,181],"an":[4,156,193],"important":[5],"function":[6],"of":[7,38,55,99,116,126,128,133,143,196],"robotic":[8],"audition.":[9],"Although":[10],"HMM-":[11],"or":[12,207],"TDNN-based":[13],"methods":[14,58],"can":[15],"also":[16,64],"be":[17,65,68],"used":[18],"for":[19,59,88,169,192,199],"environmental":[20,39,60,89,117,144,171],"recognition,":[22,25],"unlike":[23],"speech":[24,127],"it":[26],"not":[28,120],"possible":[29],"to":[30,81,186],"create":[31],"a":[32,83,160,197,203,208],"perfect":[33],"database":[34,158,161],"covering":[35],"all":[36],"kinds":[37],"sounds.":[40],"depends":[44],"more":[45],"on":[46,71],"the":[47,57,96,100,104,108,131,140,164,187],"robot":[48,198,206],"computer":[49],"system":[50,87,195],"task.":[51],"From":[52],"this":[53,77],"point":[54],"view,":[56],"must":[63],"task-dependent":[66],"and":[67,74,107,135,159,183,190],"evaluated":[69],"based":[70],"accuracy,":[72],"speed":[73],"simplicity.":[75],"In":[76],"research,":[78],"we":[79],"tried":[80],"use":[82],"multilayered":[84],"perceptron":[85],"NN":[86],"recognition.":[91],"The":[92,114,166,178],"input":[93],"data":[94,173],"one-dimensional":[97],"combination":[98,132],"instantaneous":[101],"spectrum":[102,115],"at":[103],"power":[105,109,134],"peak":[106],"pattern":[110,137],"in":[111],"time":[112],"domain.":[113],"sounds":[118,145],"do":[119],"change":[121],"as":[122,124],"remarkedly":[123],"that":[125],"voice,":[129],"so":[130],"frequency":[136],"will":[138],"retain":[139],"major":[141],"features":[142],"but":[146],"with":[147],"drastically":[148],"reduced":[149],"data.":[150],"Two":[151],"experiments":[152],"were":[153],"conducted":[154],"using":[155],"original":[157],"created":[162],"by":[163],"RWCP.":[165],"rate":[168],"45":[170],"sets":[174],"was":[175],"about":[176],"92%.":[177],"new":[179],"method":[180],"fast":[182],"simple":[184],"compared":[185],"HMM-based":[188],"methods,":[189],"suitable":[191],"on-board":[194],"home":[200],"use,":[201],"e.g.":[202],"security":[204],"monitoring":[205],"home-helper":[209],"robot.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
