{"id":"https://openalex.org/W2570861022","doi":"https://doi.org/10.1109/taslp.2017.2651361","title":"Modelling Semantic Context of OOV Words in Large Vocabulary Continuous Speech Recognition","display_name":"Modelling Semantic Context of OOV Words in Large Vocabulary Continuous Speech Recognition","publication_year":2017,"publication_date":"2017-01-10","ids":{"openalex":"https://openalex.org/W2570861022","doi":"https://doi.org/10.1109/taslp.2017.2651361","mag":"2570861022"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2017.2651361","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2651361","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://inria.hal.science/hal-01461617","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023803850","display_name":"Imran Sheikh","orcid":"https://orcid.org/0000-0001-5041-7398"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Imran Sheikh","raw_affiliation_strings":["Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838","https://openalex.org/I90183372","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046546502","display_name":"Dominique Fohr","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Dominique Fohr","raw_affiliation_strings":["Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838","https://openalex.org/I90183372","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073463405","display_name":"Irina Illina","orcid":"https://orcid.org/0000-0003-2598-4643"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Irina Illina","raw_affiliation_strings":["Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Multispeech (Inria/CNRS/Universit\u00e9 de Lorraine) Project-Team at LORIA, UMR 7503, Vandoeuvre-l\u00e8s-Nancy, France","institution_ids":["https://openalex.org/I4210121838","https://openalex.org/I90183372","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"MULTISPEECH - Speech Modeling for Facilitating Oral-Based Communication (Centre Inria de l'Universit\u00e9 de Lorraine , 615 Rue du Jardin-Botanique, 54600 Villers-l\u00e8s-Nancy - France)","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050508708","display_name":"Georges Linar\u00e8s","orcid":"https://orcid.org/0000-0001-8049-9056"},"institutions":[{"id":"https://openalex.org/I198415970","display_name":"Universit\u00e9 d'Avignon et des Pays de Vaucluse","ror":"https://ror.org/00mfpxb84","country_code":"FR","type":"education","lineage":["https://openalex.org/I198415970"]},{"id":"https://openalex.org/I4210119991","display_name":"Laboratoire Informatique d'Avignon","ror":"https://ror.org/02n399288","country_code":"FR","type":"facility","lineage":["https://openalex.org/I198415970","https://openalex.org/I4210119991"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Georges Linares","raw_affiliation_strings":["Laboratoire d'Informatique d'Avignon, University of Avignon, Avignon, France","LIA - Laboratoire Informatique d'Avignon (339 Chemin des Meinajaries Agroparc BP 1228 84911 Avignon cedex 9 - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Laboratoire d'Informatique d'Avignon, University of Avignon, Avignon, France","institution_ids":["https://openalex.org/I4210119991","https://openalex.org/I198415970"]},{"raw_affiliation_string":"LIA - Laboratoire Informatique d'Avignon (339 Chemin des Meinajaries Agroparc BP 1228 84911 Avignon cedex 9 - France)","institution_ids":["https://openalex.org/I4210119991"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.6849,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.92120249,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"25","issue":"3","first_page":"598","last_page":"610"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8886187076568604},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6518664360046387},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6299275755882263},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6282029151916504},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6097409129142761},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5696144104003906},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5358765125274658},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5332649946212769},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5263534784317017},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4742687940597534},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4548400938510895},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.4527169167995453},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.2655312418937683},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07219496369361877}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8886187076568604},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6518664360046387},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6299275755882263},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6282029151916504},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6097409129142761},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5696144104003906},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5358765125274658},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5332649946212769},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5263534784317017},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4742687940597534},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4548400938510895},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.4527169167995453},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.2655312418937683},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07219496369361877},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2017.2651361","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2017.2651361","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-01461617v1","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-01461617","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2017, 25 (3), pp.598 - 610. &#x27E8;10.1109/TASLP.2017.2651361&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-01461617v1","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-01461617","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2017, 25 (3), pp.598 - 610. &#x27E8;10.1109/TASLP.2017.2651361&#x27E9;","raw_type":"Journal articles"},"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G6073750246","display_name":"Exploitation of context for proper names recognition in the diachronic audio documents","funder_award_id":"ANR-12-BS02-0009","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":119,"referenced_works":["https://openalex.org/W1370891","https://openalex.org/W6908809","https://openalex.org/W46233444","https://openalex.org/W51407305","https://openalex.org/W54232710","https://openalex.org/W58893626","https://openalex.org/W72347498","https://openalex.org/W81527949","https://openalex.org/W103603550","https://openalex.org/W109583113","https://openalex.org/W119112377","https://openalex.org/W151556337","https://openalex.org/W626798658","https://openalex.org/W1488211819","https://openalex.org/W1514535095","https://openalex.org/W1521958654","https://openalex.org/W1524333225","https://openalex.org/W1524340867","https://openalex.org/W1528022942","https://openalex.org/W1532325895","https://openalex.org/W1554187497","https://openalex.org/W1614298861","https://openalex.org/W1631260214","https://openalex.org/W1662133657","https://openalex.org/W1806891645","https://openalex.org/W1832693441","https://openalex.org/W1880262756","https://openalex.org/W1983032739","https://openalex.org/W1984251878","https://openalex.org/W1986573365","https://openalex.org/W1990190154","https://openalex.org/W2001082470","https://openalex.org/W2035573568","https://openalex.org/W2076762622","https://openalex.org/W2086061098","https://openalex.org/W2090755665","https://openalex.org/W2095705004","https://openalex.org/W2100068632","https://openalex.org/W2103587173","https://openalex.org/W2105660309","https://openalex.org/W2120615054","https://openalex.org/W2125573226","https://openalex.org/W2131571251","https://openalex.org/W2133564696","https://openalex.org/W2135535719","https://openalex.org/W2138649166","https://openalex.org/W2140833774","https://openalex.org/W2146688305","https://openalex.org/W2147152072","https://openalex.org/W2153579005","https://openalex.org/W2154304724","https://openalex.org/W2170973209","https://openalex.org/W2216973458","https://openalex.org/W2226562530","https://openalex.org/W2250473257","https://openalex.org/W2250539671","https://openalex.org/W2251103205","https://openalex.org/W2251124635","https://openalex.org/W2251803266","https://openalex.org/W2251830157","https://openalex.org/W2251939518","https://openalex.org/W2264898703","https://openalex.org/W2290562648","https://openalex.org/W2291368429","https://openalex.org/W2292819335","https://openalex.org/W2327501763","https://openalex.org/W2399073184","https://openalex.org/W2403088945","https://openalex.org/W2403501951","https://openalex.org/W2407046429","https://openalex.org/W2508297107","https://openalex.org/W2572708339","https://openalex.org/W2800971787","https://openalex.org/W2950577311","https://openalex.org/W2951829787","https://openalex.org/W2952729433","https://openalex.org/W2963042536","https://openalex.org/W2963355447","https://openalex.org/W2963921497","https://openalex.org/W2964308564","https://openalex.org/W3102751229","https://openalex.org/W4213009331","https://openalex.org/W4231510805","https://openalex.org/W4294170691","https://openalex.org/W4297806265","https://openalex.org/W4400537618","https://openalex.org/W6600284362","https://openalex.org/W6602125538","https://openalex.org/W6602231221","https://openalex.org/W6602415096","https://openalex.org/W6602935006","https://openalex.org/W6603270684","https://openalex.org/W6604155191","https://openalex.org/W6604751875","https://openalex.org/W6619939461","https://openalex.org/W6630875275","https://openalex.org/W6631362777","https://openalex.org/W6631534535","https://openalex.org/W6636510571","https://openalex.org/W6636953519","https://openalex.org/W6639565716","https://openalex.org/W6639619044","https://openalex.org/W6675301171","https://openalex.org/W6678656546","https://openalex.org/W6679434410","https://openalex.org/W6680887930","https://openalex.org/W6682691769","https://openalex.org/W6685158001","https://openalex.org/W6689023924","https://openalex.org/W6691459498","https://openalex.org/W6693515496","https://openalex.org/W6696537820","https://openalex.org/W6696910420","https://openalex.org/W6697034289","https://openalex.org/W6712405136","https://openalex.org/W6713325753","https://openalex.org/W6713967003","https://openalex.org/W6738269772","https://openalex.org/W6989537589"],"related_works":["https://openalex.org/W3126382579","https://openalex.org/W3107650560","https://openalex.org/W2810542905","https://openalex.org/W4315588616","https://openalex.org/W4317422773","https://openalex.org/W2888805565","https://openalex.org/W2250993361","https://openalex.org/W2043781532","https://openalex.org/W3096664139","https://openalex.org/W4385890381"],"abstract_inverted_index":{"The":[0],"diachronic":[1,65],"nature":[2],"of":[3,11,24,31,44,61,72,90,96,126,155,221],"broadcast":[4,163],"news":[5,164],"data":[6],"leads":[7],"to":[8,144,148],"the":[9,59,70,73,77,87,91,118,169,175,187,205,214,219,222],"problem":[10,60],"out-of-vocabulary":[12],"(OOV)":[13],"words":[14,26,139,149],"in":[15,64,203],"large":[16],"vocabulary":[17,207],"continuous":[18,113],"speech":[19,200],"recognition":[20,201],"(LVCSR)":[21],"systems.":[22],"Analysis":[23],"OOV":[25,62,81,97,157,216],"reveals":[27],"that":[28,150,168],"a":[29,136,193],"majority":[30],"them":[32],"are":[33,39,83,151,211],"proper":[34],"names":[35],"(PNs).":[36],"However,":[37],"PNs":[38,63,74,82],"important":[40,152],"for":[41,48,153],"automatic":[42,51],"indexing":[43],"audio-video":[45],"content":[46],"and":[47,102,117,131,171,183,189,208],"obtaining":[49],"reliable":[50],"transcriptions.":[52,93],"In":[53],"this":[54],"paper,":[55],"we":[56,99,166],"focus":[57],"on":[58,161,178],"audio":[66],"documents.":[67],"To":[68],"enable":[69],"recovery":[71],"missed":[75],"by":[76,85],"LVCSR":[78,92,206],"system,":[79],"relevant":[80],"retrieved":[84,215],"exploiting":[86],"semantic":[88,103],"context":[89,104,132,224],"For":[94],"retrieval":[95,154],"PNs,":[98,217],"explore":[100],"topic":[101,111],"derived":[105],"from":[106,181],"latent":[107],"Dirichlet":[108],"allocation":[109],"(LDA)":[110],"models,":[112],"word":[114,130],"vector":[115],"representations":[116],"neural":[119,137],"bag-of-words":[120],"(NBOW)":[121],"model":[122,141,210],"which":[123,142,204],"is":[124],"capable":[125],"learning":[127],"task":[128],"specific":[129],"representations.":[133],"We":[134],"propose":[135],"bag-of-weighted":[138],"(NBOW2)":[140],"learns":[143],"assign":[145],"higher":[146],"weights":[147],"an":[156],"PN.":[158],"With":[159],"experiments":[160],"French":[162],"videos,":[165],"show":[167],"NBOW":[170,188],"NBOW2":[172,190],"models":[173,191],"outperform":[174],"methods":[176],"based":[177],"raw":[179],"embeddings":[180],"LDA":[182],"Skip-gram":[184],"models.":[185,225],"Combining":[186],"gives":[192],"faster":[194],"convergence":[195],"during":[196],"training.":[197],"Second":[198],"pass":[199],"experiments,":[202],"language":[209],"updated":[212],"with":[213],"demonstrate":[218],"effectiveness":[220],"proposed":[223]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2}],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2025-10-10T00:00:00"}
