{"id":"https://openalex.org/W2095126095","doi":"https://doi.org/10.1109/apsipa.2013.6694175","title":"Context dependent acoustic keyword spotting using deep neural network","display_name":"Context dependent acoustic keyword spotting using deep neural network","publication_year":2013,"publication_date":"2013-10-01","ids":{"openalex":"https://openalex.org/W2095126095","doi":"https://doi.org/10.1109/apsipa.2013.6694175","mag":"2095126095"},"language":"en","primary_location":{"id":"doi:10.1109/apsipa.2013.6694175","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2013.6694175","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085034441","display_name":"Guangsen Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Guangsen Wang","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore","Sch. of Comput. Nat., Univ. of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Sch. of Comput. Nat., Univ. of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032798707","display_name":"Khe Chai Sim","orcid":"https://orcid.org/0000-0002-0866-2223"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Khe Chai Sim","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore","Sch. of Comput. Nat., Univ. of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Sch. of Comput. Nat., Univ. of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5085034441"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.4809,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.76756022,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8387066125869751},{"id":"https://openalex.org/keywords/keyword-spotting","display_name":"Keyword spotting","score":0.8180428147315979},{"id":"https://openalex.org/keywords/spotting","display_name":"Spotting","score":0.7366750240325928},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6315685510635376},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5870761871337891},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5399584174156189},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5306870937347412},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5216522812843323},{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.5151070952415466},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5117549896240234},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49765732884407043},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4747351109981537},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4473681151866913},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.41454073786735535},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.15744665265083313},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15297988057136536},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11782047152519226},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09039467573165894}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8387066125869751},{"id":"https://openalex.org/C2781213101","wikidata":"https://www.wikidata.org/wiki/Q6398558","display_name":"Keyword spotting","level":2,"score":0.8180428147315979},{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.7366750240325928},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6315685510635376},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5870761871337891},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5399584174156189},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5306870937347412},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5216522812843323},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.5151070952415466},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5117549896240234},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49765732884407043},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4747351109981537},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4473681151866913},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41454073786735535},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.15744665265083313},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15297988057136536},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11782047152519226},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09039467573165894},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/apsipa.2013.6694175","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2013.6694175","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:scholarbank.nus.edu.sg:10635/78071","is_oa":false,"landing_page_url":"http://scholarbank.nus.edu.sg/handle/10635/78071","pdf_url":null,"source":{"id":"https://openalex.org/S7407052290","display_name":"National University of Singapore","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scopus","raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5799999833106995,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W115152891","https://openalex.org/W1488355515","https://openalex.org/W1553004968","https://openalex.org/W1561705024","https://openalex.org/W1984806059","https://openalex.org/W1993882792","https://openalex.org/W2046932483","https://openalex.org/W2056986588","https://openalex.org/W2074671152","https://openalex.org/W2101346879","https://openalex.org/W2135321730","https://openalex.org/W2136922672","https://openalex.org/W2142806759","https://openalex.org/W2145215282","https://openalex.org/W2159436188","https://openalex.org/W2167356925","https://openalex.org/W2336725036","https://openalex.org/W2405666970","https://openalex.org/W2918078540","https://openalex.org/W6604665520","https://openalex.org/W6713568955","https://openalex.org/W6759924013"],"related_works":["https://openalex.org/W2918559346","https://openalex.org/W2114097550","https://openalex.org/W4286904253","https://openalex.org/W3119978414","https://openalex.org/W2516975559","https://openalex.org/W2545741539","https://openalex.org/W3206647229","https://openalex.org/W1969408022","https://openalex.org/W2000885660","https://openalex.org/W2117995638"],"abstract_inverted_index":{"Language":[0],"model":[1,29,91,168,218],"is":[2,30,58,98,220],"an":[3],"essential":[4,221],"component":[5],"of":[6,165],"a":[7,88],"speech":[8],"recogniser.":[9],"It":[10],"provides":[11,170],"the":[12,18,23,33,39,42,46,61,69,79,102,114,117,121,126,137,152,163,166,174,184,192,198,202,207,216,225],"additional":[13],"linguistic":[14],"information":[15,169,219],"to":[16,37,71,135,201,222],"constrain":[17],"search":[19],"space":[20],"and":[21,78,95,125,227],"guide":[22],"decoding.":[24],"In":[25,210],"this":[26],"paper,":[27],"language":[28,90,167,217],"incorporated":[31],"in":[32],"keyword":[34,43,65,72,118,141,146],"spotting":[35,108,142,147,208],"system":[36,190],"provide":[38,85],"contexts":[40,66,181],"for":[41,182],"models":[44],"under":[45],"weighted":[47],"finite":[48],"state":[49],"transducer":[50],"framework.":[51],"A":[52],"context":[53,77,138,176,196],"independent":[54,177],"deep":[55],"neural":[56],"network":[57],"trained":[59,99],"as":[60,136],"acoustic":[62],"model.":[63],"Three":[64,106],"are":[67,110,133,149],"investigated:":[68],"phone":[70,96],"context,":[73],"fixed":[74],"length":[75,81,194],"word":[76,82,94,103,122,127,195],"arbitrary":[80,193],"context.":[83],"To":[84],"these":[86],"contexts,":[87],"hybrid":[89],"with":[92],"both":[93,224],"tokens":[97],"using":[100,191],"only":[101],"n-gram":[104],"count.":[105],"different":[107],"graphs":[109,132],"studied":[111],"depending":[112],"on":[113,151],"involved":[115],"contexts:":[116],"loop":[119,128],"graph,":[120],"fillers":[123,129],"graph":[124,178],"graph.":[130],"These":[131],"referred":[134],"dependent":[139],"(CD)":[140],"graphs.":[143,187],"The":[144,188],"CD":[145,186],"systems":[148],"evaluated":[150],"Broadcasting":[153],"News":[154],"Hub4-97":[155],"F0":[156],"evaluation":[157],"set.":[158],"Experimental":[159],"results":[160],"reveal":[161],"that":[162,215],"incorporation":[164],"performance":[171,200],"gain":[172],"over":[173],"baseline":[175],"without":[179],"any":[180],"all":[183],"three":[185],"best":[189],"has":[197],"comparable":[199],"full":[203],"decoding":[204],"but":[205],"triples":[206],"speed.":[209],"addition,":[211],"error":[212],"analysis":[213],"demonstrates":[214],"reduce":[223],"insertion":[226],"deletion":[228],"errors.":[229]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
