{"id":"https://openalex.org/W2402972567","doi":"https://doi.org/10.21437/interspeech.2012-637","title":"Discriminatively trained phoneme confusion model for keyword spotting","display_name":"Discriminatively trained phoneme confusion model for keyword spotting","publication_year":2012,"publication_date":"2012-09-09","ids":{"openalex":"https://openalex.org/W2402972567","doi":"https://doi.org/10.21437/interspeech.2012-637","mag":"2402972567"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2012-637","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-637","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038666525","display_name":"Panagiota Karanasou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115485","display_name":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","ror":"https://ror.org/01raq4x89","country_code":"FR","type":"facility","lineage":["https://openalex.org/I102197404","https://openalex.org/I1294671590","https://openalex.org/I4210115485","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Panagiota Karanasou","raw_affiliation_strings":["Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur"],"affiliations":[{"raw_affiliation_string":"Laboratoire d'Informatique pour la M\u00e9canique et les Sciences de l'Ing\u00e9nieur","institution_ids":["https://openalex.org/I4210115485"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042273299","display_name":"Luk\u00e1\u0161 Burget","orcid":"https://orcid.org/0000-0002-4951-5908"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lukas Burget","raw_affiliation_strings":["SRI-International"],"affiliations":[{"raw_affiliation_string":"SRI-International","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060715364","display_name":"Dimitra Vergyri","orcid":null},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dimitra Vergyri","raw_affiliation_strings":["SRI-International"],"affiliations":[{"raw_affiliation_string":"SRI-International","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076998541","display_name":"Murat Akbacak","orcid":null},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Murat Akbacak","raw_affiliation_strings":["SRI-International"],"affiliations":[{"raw_affiliation_string":"SRI-International","institution_ids":["https://openalex.org/I1298353152"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103079610","display_name":"Arindam Mandal","orcid":"https://orcid.org/0000-0001-5944-2733"},"institutions":[{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arindam Mandal","raw_affiliation_strings":["SRI-International"],"affiliations":[{"raw_affiliation_string":"SRI-International","institution_ids":["https://openalex.org/I1298353152"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5038666525"],"corresponding_institution_ids":["https://openalex.org/I4210115485"],"apc_list":null,"apc_paid":null,"fwci":3.537,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.93244957,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2434","last_page":"2437"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/keyword-spotting","display_name":"Keyword spotting","score":0.9544458985328674},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8689159154891968},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.817138671875},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6736675500869751},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.652404248714447},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5740417242050171},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5379856824874878},{"id":"https://openalex.org/keywords/confusion","display_name":"Confusion","score":0.5024540424346924},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4744592607021332},{"id":"https://openalex.org/keywords/spotting","display_name":"Spotting","score":0.470967561006546},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42695310711860657}],"concepts":[{"id":"https://openalex.org/C2781213101","wikidata":"https://www.wikidata.org/wiki/Q6398558","display_name":"Keyword spotting","level":2,"score":0.9544458985328674},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8689159154891968},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.817138671875},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6736675500869751},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.652404248714447},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5740417242050171},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5379856824874878},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.5024540424346924},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4744592607021332},{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.470967561006546},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42695310711860657},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C11171543","wikidata":"https://www.wikidata.org/wiki/Q41630","display_name":"Psychoanalysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2012-637","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-637","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.299.4496","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.299.4496","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.speech.sri.com/papers/interspeech2012-karanasou-kws.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W49437105","https://openalex.org/W1537729828","https://openalex.org/W1553339574","https://openalex.org/W1582482241","https://openalex.org/W2046932483","https://openalex.org/W2056986588","https://openalex.org/W2154485447","https://openalex.org/W2167338739"],"related_works":["https://openalex.org/W2918559346","https://openalex.org/W2114097550","https://openalex.org/W4286904253","https://openalex.org/W3119978414","https://openalex.org/W2516975559","https://openalex.org/W2545741539","https://openalex.org/W3206647229","https://openalex.org/W1969408022","https://openalex.org/W2000885660","https://openalex.org/W2117995638"],"abstract_inverted_index":{"Keyword":[0],"Spotting":[1],"(KWS)":[2],"aims":[3],"at":[4],"detecting":[5],"speech":[6,21],"segments":[7],"that":[8,81],"contain":[9],"a":[10,20,26,56,66],"given":[11],"query":[12],"within":[13],"large":[14],"amounts":[15],"of":[16,31,34,51,65,87,117],"audio":[17],"data.":[18],"Typically,":[19],"recognizer":[22],"is":[23,36,82,84,91],"involved":[24],"in":[25],"first":[27],"indexing":[28],"step.":[29],"One":[30],"the":[32,49,62,75,85,95,109,115],"challenges":[33],"KWS":[35,67,96],"how":[37],"to":[38,54,73,94],"handle":[39,74],"recognition":[40],"errors":[41],"and":[42,111],"out-of-vocabulary":[43],"(OOV)":[44],"terms.":[45],"This":[46],"work":[47],"proposes":[48],"use":[50,116],"discriminative":[52],"training":[53],"construct":[55],"phoneme":[57],"confusion":[58],"model,":[59],"which":[60,90],"expands":[61],"phonemic":[63,71],"index":[64],"system":[68],"by":[69],"adding":[70],"variation":[72],"abovementioned":[76],"problems.":[77],"The":[78,98],"objective":[79],"function":[80],"optimized":[83],"Figure":[86],"Merit":[88],"(FOM),":[89],"directly":[92],"related":[93],"performance.":[97],"experiments":[99],"conducted":[100],"on":[101,108],"English":[102],"data":[103],"sets":[104],"show":[105],"some":[106],"improvement":[107],"FOM":[110],"are":[112],"promising":[113],"for":[114],"such":[118],"technique.":[119]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
