{"id":"https://openalex.org/W2060417883","doi":"https://doi.org/10.1109/apsipa.2013.6694118","title":"Voice activity detection based on density ratio estimation and system combination","display_name":"Voice activity detection based on density ratio estimation and system combination","publication_year":2013,"publication_date":"2013-10-01","ids":{"openalex":"https://openalex.org/W2060417883","doi":"https://doi.org/10.1109/apsipa.2013.6694118","mag":"2060417883"},"language":"en","primary_location":{"id":"doi:10.1109/apsipa.2013.6694118","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2013.6694118","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022767796","display_name":"Yuuki Tachioka","orcid":"https://orcid.org/0009-0002-0587-2943"},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]},{"id":"https://openalex.org/I1306287861","display_name":"Mitsubishi Group (Japan)","ror":"https://ror.org/0234cd281","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yuuki Tachioka","raw_affiliation_strings":["Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","institution_ids":["https://openalex.org/I4210133125"]},{"raw_affiliation_string":"Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan","institution_ids":["https://openalex.org/I1306287861"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112393630","display_name":"Toshiyuki Hanazawa","orcid":null},"institutions":[{"id":"https://openalex.org/I1306287861","display_name":"Mitsubishi Group (Japan)","ror":"https://ror.org/0234cd281","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861"]},{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Toshiyuki Hanazawa","raw_affiliation_strings":["Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","institution_ids":["https://openalex.org/I4210133125"]},{"raw_affiliation_string":"Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan","institution_ids":["https://openalex.org/I1306287861"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102253712","display_name":"Tomohiro Narita","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]},{"id":"https://openalex.org/I1306287861","display_name":"Mitsubishi Group (Japan)","ror":"https://ror.org/0234cd281","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomohiro Narita","raw_affiliation_strings":["Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","institution_ids":["https://openalex.org/I4210133125"]},{"raw_affiliation_string":"Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan","institution_ids":["https://openalex.org/I1306287861"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055378566","display_name":"Jun Ishii","orcid":"https://orcid.org/0000-0003-2568-515X"},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]},{"id":"https://openalex.org/I1306287861","display_name":"Mitsubishi Group (Japan)","ror":"https://ror.org/0234cd281","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jun Ishii","raw_affiliation_strings":["Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"Information Technology R&D Center, Mitsubishi Electric Corporation, Kanagawa, Japan","institution_ids":["https://openalex.org/I4210133125"]},{"raw_affiliation_string":"Inf. Technol. R & D Center, Mitsubishi Electr. Corp., Kanagawa, Japan","institution_ids":["https://openalex.org/I1306287861"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5022767796"],"corresponding_institution_ids":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.12779665,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/likelihood-ratio-test","display_name":"Likelihood-ratio test","score":0.8274136185646057},{"id":"https://openalex.org/keywords/kernel-density-estimation","display_name":"Kernel density estimation","score":0.6410145163536072},{"id":"https://openalex.org/keywords/signal-to-noise-ratio","display_name":"Signal-to-noise ratio (imaging)","score":0.6034560799598694},{"id":"https://openalex.org/keywords/density-ratio","display_name":"Density ratio","score":0.5944475531578064},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5697916150093079},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.5119613409042358},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.43624579906463623},{"id":"https://openalex.org/keywords/maximum-likelihood-sequence-estimation","display_name":"Maximum likelihood sequence estimation","score":0.4318048357963562},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.417529821395874},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.41614723205566406},{"id":"https://openalex.org/keywords/likelihood-ratios-in-diagnostic-testing","display_name":"Likelihood ratios in diagnostic testing","score":0.41283899545669556},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.36224690079689026},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3491154909133911},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3302271366119385},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.15758466720581055},{"id":"https://openalex.org/keywords/receiver-operating-characteristic","display_name":"Receiver operating characteristic","score":0.1037161648273468}],"concepts":[{"id":"https://openalex.org/C9483764","wikidata":"https://www.wikidata.org/wiki/Q585740","display_name":"Likelihood-ratio test","level":2,"score":0.8274136185646057},{"id":"https://openalex.org/C71134354","wikidata":"https://www.wikidata.org/wiki/Q458825","display_name":"Kernel density estimation","level":3,"score":0.6410145163536072},{"id":"https://openalex.org/C13944312","wikidata":"https://www.wikidata.org/wiki/Q7512748","display_name":"Signal-to-noise ratio (imaging)","level":2,"score":0.6034560799598694},{"id":"https://openalex.org/C2776436304","wikidata":"https://www.wikidata.org/wiki/Q30693829","display_name":"Density ratio","level":2,"score":0.5944475531578064},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5697916150093079},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.5119613409042358},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.43624579906463623},{"id":"https://openalex.org/C191462741","wikidata":"https://www.wikidata.org/wiki/Q6795902","display_name":"Maximum likelihood sequence estimation","level":3,"score":0.4318048357963562},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.417529821395874},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.41614723205566406},{"id":"https://openalex.org/C144494922","wikidata":"https://www.wikidata.org/wiki/Q6547272","display_name":"Likelihood ratios in diagnostic testing","level":3,"score":0.41283899545669556},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.36224690079689026},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3491154909133911},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3302271366119385},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.15758466720581055},{"id":"https://openalex.org/C58471807","wikidata":"https://www.wikidata.org/wiki/Q327120","display_name":"Receiver operating characteristic","level":2,"score":0.1037161648273468},{"id":"https://openalex.org/C57879066","wikidata":"https://www.wikidata.org/wiki/Q41217","display_name":"Mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipa.2013.6694118","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2013.6694118","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6499999761581421,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W129077257","https://openalex.org/W149260027","https://openalex.org/W191108438","https://openalex.org/W638544165","https://openalex.org/W1590861666","https://openalex.org/W2009422037","https://openalex.org/W2032474878","https://openalex.org/W2059520982","https://openalex.org/W2103738385","https://openalex.org/W2108819501","https://openalex.org/W2124611315","https://openalex.org/W2129120544","https://openalex.org/W2172237138","https://openalex.org/W2294819182","https://openalex.org/W6676004468","https://openalex.org/W6696839641"],"related_works":["https://openalex.org/W2064349045","https://openalex.org/W4240323427","https://openalex.org/W2126676767","https://openalex.org/W2151194086","https://openalex.org/W2138137679","https://openalex.org/W2141324124","https://openalex.org/W2060417883","https://openalex.org/W2116709453","https://openalex.org/W2104077770","https://openalex.org/W2432570319"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,81,86],"robust":[3],"voice":[4],"activity":[5],"detection":[6],"(VAD)":[7],"based":[8],"on":[9],"density":[10,73,90,109],"ratio":[11,19,52,74,78,91,110,118],"estimation.":[12],"In":[13],"highly":[14],"noisy":[15,158],"environments,":[16],"the":[17,33,50,72,108,113,116,132,146],"likelihood":[18,34,43,51,61,77,87,117],"test":[20],"(LRT)":[21],"is":[22,58,65,106,122,135,149],"effective.":[23],"Conventional":[24],"LRT":[25],"estimates":[26],"both":[27],"speech":[28,54,121],"and":[29,38,55,83,99,120],"noise":[30,56,100],"models,":[31],"calculates":[32],"of":[35,41,53,62,71,115],"each":[36],"model,":[37],"uses":[39],"ratios":[40],"such":[42],"to":[44,93],"detect":[45],"speech.":[46],"However,":[47],"in":[48,156],"LRT,":[49],"models":[57,64,76],"required,":[59],"whereas":[60],"individual":[63],"not":[66],"necessarily":[67],"required.":[68],"The":[69],"framework":[70],"estimation":[75,92,111],"functions":[79,119],"by":[80],"kernel":[82],"directly":[84],"generates":[85],"ratio.":[88],"Applying":[89],"VAD":[94],"requires":[95],"that":[96,145],"feature":[97],"selection":[98],"adaptation":[101],"must":[102],"be":[103],"considered.":[104],"This":[105,124],"because":[107],"constrains":[112],"shape":[114],"dynamic.":[123],"paper":[125],"addresses":[126],"these":[127],"problems.":[128],"To":[129],"improve":[130],"accuracy,":[131],"proposed":[133,147],"method":[134,148],"combined":[136],"with":[137],"conventional":[138,153],"LRT.":[139],"Experimental":[140],"results":[141],"using":[142],"CENSREC-1-C":[143],"show":[144],"more":[150],"effective":[151],"than":[152],"methods,":[154],"especially":[155],"non-stationary":[157],"environments.":[159]},"counts_by_year":[{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
