{"id":"https://openalex.org/W2235839570","doi":"https://doi.org/10.1109/asru.2015.7404766","title":"Different word representations and their combination for proper name retrieval from diachronic documents","display_name":"Different word representations and their combination for proper name retrieval from diachronic documents","publication_year":2015,"publication_date":"2015-12-01","ids":{"openalex":"https://openalex.org/W2235839570","doi":"https://doi.org/10.1109/asru.2015.7404766","mag":"2235839570"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2015.7404766","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2015.7404766","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073463405","display_name":"Irina Illina","orcid":"https://orcid.org/0000-0003-2598-4643"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Irina Illina","raw_affiliation_strings":["CNRS, LORIA, UMR 7503, France","Inria, France","MultiSpeech team","Universit\u00e9 de Lorraine, LORIA, UMR 7503, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CNRS, LORIA, UMR 7503, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210121838"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"MultiSpeech team","institution_ids":[]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, LORIA, UMR 7503, France","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121838"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046546502","display_name":"Dominique Fohr","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Dominique Fohr","raw_affiliation_strings":["CNRS, LORIA, UMR 7503, France","Inria, France","MultiSpeech team","Universit\u00e9 de Lorraine, LORIA, UMR 7503, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CNRS, LORIA, UMR 7503, France","institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210121838"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"MultiSpeech team","institution_ids":[]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, LORIA, UMR 7503, France","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121838"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4452,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.7796037,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"3","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8752726316452026},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.7572334408760071},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7251396775245667},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6946879029273987},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5901768207550049},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.5433550477027893},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5327605605125427},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.519342303276062},{"id":"https://openalex.org/keywords/complementarity","display_name":"Complementarity (molecular biology)","score":0.4889887571334839},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.4588705897331238},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.45781010389328003},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4542752206325531},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4110441505908966},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3979473412036896},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.37269851565361023},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1055915355682373}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8752726316452026},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.7572334408760071},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7251396775245667},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6946879029273987},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5901768207550049},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.5433550477027893},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5327605605125427},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.519342303276062},{"id":"https://openalex.org/C202269582","wikidata":"https://www.wikidata.org/wiki/Q2644277","display_name":"Complementarity (molecular biology)","level":2,"score":0.4889887571334839},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.4588705897331238},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.45781010389328003},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4542752206325531},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4110441505908966},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3979473412036896},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.37269851565361023},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1055915355682373},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru.2015.7404766","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2015.7404766","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8100000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W18904795","https://openalex.org/W72347498","https://openalex.org/W151556337","https://openalex.org/W171871506","https://openalex.org/W1524340867","https://openalex.org/W1524940700","https://openalex.org/W1552863221","https://openalex.org/W1556927139","https://openalex.org/W1614298861","https://openalex.org/W1832693441","https://openalex.org/W1853745982","https://openalex.org/W1880262756","https://openalex.org/W1984541135","https://openalex.org/W1988596541","https://openalex.org/W1988686126","https://openalex.org/W2076762622","https://openalex.org/W2095638614","https://openalex.org/W2103635001","https://openalex.org/W2141599568","https://openalex.org/W2153579005","https://openalex.org/W2157006255","https://openalex.org/W2250539671","https://openalex.org/W2290562648","https://openalex.org/W2396216106","https://openalex.org/W2577477452","https://openalex.org/W4230856239","https://openalex.org/W4231510805","https://openalex.org/W4294170691","https://openalex.org/W6600763656","https://openalex.org/W6602935006","https://openalex.org/W6606983585","https://openalex.org/W6636510571","https://openalex.org/W6639155442","https://openalex.org/W6639619044","https://openalex.org/W6647288420","https://openalex.org/W6680890276","https://openalex.org/W6682691769","https://openalex.org/W6683240801","https://openalex.org/W6691431627","https://openalex.org/W6696537820","https://openalex.org/W6989537589"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W3005513013"],"abstract_inverted_index":{"This":[0,131],"paper":[1],"deals":[2],"with":[3],"the":[4,20,37,71,123,133],"problem":[5,21],"of":[6,22,25,43,60,112,135],"high-quality":[7],"transcription":[8],"systems":[9],"for":[10,104],"very":[11],"large":[12],"vocabulary":[13],"automatic":[14,23],"speech":[15],"recognition":[16],"(ASR).":[17],"We":[18,31],"investigate":[19],"retrieval":[24,91,113],"out-of-vocabulary":[26],"(OOV)":[27],"proper":[28],"names":[29],"(PNs).":[30],"want":[32],"to":[33,128],"take":[34],"into":[35],"account":[36],"temporal,":[38],"syntactic":[39],"and":[40,106],"semantic":[41],"context":[42,97,108],"words.":[44],"Nowadays,":[45],"Artificial":[46],"Neural":[47],"Networks":[48],"(NN)":[49],"are":[50],"widely":[51],"used":[52],"in":[53],"natural":[54],"language":[55],"processing:":[56],"continuous":[57],"space":[58],"representations":[59],"words":[61],"is":[62],"learned":[63],"automatically":[64],"from":[65],"unstructured":[66],"text":[67],"data.":[68],"To":[69],"model":[70],"latent":[72],"topics":[73],"at":[74],"document":[75],"level,":[76],"Latent":[77],"Dirichlet":[78],"Allocation":[79],"(LDA)":[80],"has":[81],"been":[82],"successful.":[83],"In":[84],"this":[85],"paper,":[86],"we":[87],"propose":[88],"OOV":[89],"PN":[90],"using":[92],"(1)":[93],"temporal":[94],"versus":[95],"topic":[96],"modeling;":[98,109],"(2)":[99],"different":[100],"word":[101],"representation":[102],"spaces":[103],"word-level":[105],"document-level":[107],"(3)":[110],"combinations":[111,126],"results.":[114,130],"Experimental":[115],"evaluation":[116],"on":[117],"broadcast":[118],"news":[119],"data":[120],"shows":[121],"that":[122],"proposed":[124],"method":[125],"lead":[127],"better":[129],"confirms":[132],"complementarity":[134],"methods.":[136]},"counts_by_year":[{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
