{"id":"https://openalex.org/W4385489560","doi":"https://doi.org/10.1109/taslp.2023.3301239","title":"End-to-End Open Vocabulary Keyword Search With Multilingual Neural Representations","display_name":"End-to-End Open Vocabulary Keyword Search With Multilingual Neural Representations","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4385489560","doi":"https://doi.org/10.1109/taslp.2023.3301239"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2023.3301239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3301239","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2308.08027","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007614006","display_name":"Bolaji Yusuf","orcid":"https://orcid.org/0000-0001-9852-3456"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bolaji Yusuf","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Bo&#x011F;azi&#x00E7;i University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0001-9852-3456","affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Bo&#x011F;azi&#x00E7;i University, Istanbul, Turkey","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045539248","display_name":"Ja\u0148 \u010cernock\u00fd","orcid":"https://orcid.org/0000-0002-8800-0210"},"institutions":[{"id":"https://openalex.org/I60587646","display_name":"Brno University of Technology","ror":"https://ror.org/03613d656","country_code":"CZ","type":"education","lineage":["https://openalex.org/I60587646"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Jan \u010cernock\u00fd","raw_affiliation_strings":["Faculty of Information Technology, Speech@FIT, Brno University of Technology, Brno, Czechia","Faculty of Information Technology, Brno University of Technology, Speech@FIT, Brno, Czechia"],"raw_orcid":"https://orcid.org/0000-0002-8800-0210","affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Speech@FIT, Brno University of Technology, Brno, Czechia","institution_ids":["https://openalex.org/I60587646"]},{"raw_affiliation_string":"Faculty of Information Technology, Brno University of Technology, Speech@FIT, Brno, Czechia","institution_ids":["https://openalex.org/I60587646"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055086464","display_name":"Murat Sara\u00e7lar","orcid":"https://orcid.org/0000-0002-7435-8510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Murat Sara\u00e7lar","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Bo&#x011F;azi&#x00E7;i University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-7435-8510","affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Bo&#x011F;azi&#x00E7;i University, Istanbul, Turkey","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5007614006"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8284,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.78157383,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"31","issue":null,"first_page":"3070","last_page":"3080"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.863613486289978},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.7881330251693726},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7638682723045349},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6394062638282776},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5468875169754028},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5055904388427734},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5055651664733887},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4936305284500122},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.4478897154331207},{"id":"https://openalex.org/keywords/keyword-spotting","display_name":"Keyword spotting","score":0.425646036863327},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4235613942146301},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.41289815306663513},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4026719331741333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.863613486289978},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.7881330251693726},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7638682723045349},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6394062638282776},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5468875169754028},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5055904388427734},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5055651664733887},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4936305284500122},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.4478897154331207},{"id":"https://openalex.org/C2781213101","wikidata":"https://www.wikidata.org/wiki/Q6398558","display_name":"Keyword spotting","level":2,"score":0.425646036863327},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4235613942146301},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41289815306663513},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4026719331741333},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2023.3301239","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3301239","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2308.08027","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.08027","pdf_url":"https://arxiv.org/pdf/2308.08027","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2308.08027","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2308.08027","pdf_url":"https://arxiv.org/pdf/2308.08027","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5099999904632568,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1319050382","display_name":null,"funder_award_id":"19-26934X","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G3708067221","display_name":null,"funder_award_id":"90140","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G4177337698","display_name":null,"funder_award_id":"ID:90140","funder_id":"https://openalex.org/F4320321006","funder_display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky"},{"id":"https://openalex.org/G7097781310","display_name":null,"funder_award_id":"870930","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320321006","display_name":"Grantov\u00e1 Agentura \u010cesk\u00e9 Republiky","ror":"https://ror.org/01pv73b02"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385489560.pdf","grobid_xml":"https://content.openalex.org/works/W4385489560.grobid-xml"},"referenced_works_count":93,"referenced_works":["https://openalex.org/W49437105","https://openalex.org/W114193738","https://openalex.org/W319941341","https://openalex.org/W1494198834","https://openalex.org/W1501286448","https://openalex.org/W1607149136","https://openalex.org/W1970890968","https://openalex.org/W1978660892","https://openalex.org/W1990294375","https://openalex.org/W1992912377","https://openalex.org/W2000654171","https://openalex.org/W2005232502","https://openalex.org/W2015688877","https://openalex.org/W2031804986","https://openalex.org/W2040070072","https://openalex.org/W2050309898","https://openalex.org/W2056346282","https://openalex.org/W2057007397","https://openalex.org/W2074932712","https://openalex.org/W2075201173","https://openalex.org/W2089537772","https://openalex.org/W2090755665","https://openalex.org/W2090764203","https://openalex.org/W2106440210","https://openalex.org/W2111955662","https://openalex.org/W2119689163","https://openalex.org/W2124509324","https://openalex.org/W2124558353","https://openalex.org/W2129059886","https://openalex.org/W2137044559","https://openalex.org/W2141315442","https://openalex.org/W2142986430","https://openalex.org/W2148986421","https://openalex.org/W2152753389","https://openalex.org/W2153141912","https://openalex.org/W2167338739","https://openalex.org/W2171019095","https://openalex.org/W2186490579","https://openalex.org/W2187428966","https://openalex.org/W2291975472","https://openalex.org/W2402112460","https://openalex.org/W2402146185","https://openalex.org/W2404324365","https://openalex.org/W2407080277","https://openalex.org/W2407420912","https://openalex.org/W2407897255","https://openalex.org/W2442329935","https://openalex.org/W2578392894","https://openalex.org/W2612800309","https://openalex.org/W2697044473","https://openalex.org/W2716988359","https://openalex.org/W2746887616","https://openalex.org/W2762466393","https://openalex.org/W2767122664","https://openalex.org/W2900678559","https://openalex.org/W2944113786","https://openalex.org/W2964012862","https://openalex.org/W2972476119","https://openalex.org/W2972613398","https://openalex.org/W2973132140","https://openalex.org/W2995181338","https://openalex.org/W3015280134","https://openalex.org/W3015449694","https://openalex.org/W3015522062","https://openalex.org/W3019546258","https://openalex.org/W3024786184","https://openalex.org/W3033038061","https://openalex.org/W3036601975","https://openalex.org/W3041561163","https://openalex.org/W3095694146","https://openalex.org/W3096014412","https://openalex.org/W3161143478","https://openalex.org/W3162022030","https://openalex.org/W3163464943","https://openalex.org/W3176711365","https://openalex.org/W3181776258","https://openalex.org/W3196482042","https://openalex.org/W3197175124","https://openalex.org/W3197681820","https://openalex.org/W3207815550","https://openalex.org/W3213029956","https://openalex.org/W4225308107","https://openalex.org/W4225319488","https://openalex.org/W4226082499","https://openalex.org/W4226093136","https://openalex.org/W4226120743","https://openalex.org/W4287630531","https://openalex.org/W4297841501","https://openalex.org/W4372262245","https://openalex.org/W4385489560","https://openalex.org/W6611122713","https://openalex.org/W6714284179","https://openalex.org/W6718561954"],"related_works":["https://openalex.org/W2114097550","https://openalex.org/W4385352507","https://openalex.org/W2918559346","https://openalex.org/W84309476","https://openalex.org/W4286904253","https://openalex.org/W4282568653","https://openalex.org/W2149998531","https://openalex.org/W2119380317","https://openalex.org/W2070155952","https://openalex.org/W2082868123"],"abstract_inverted_index":{"Conventional":[0],"keyword":[1,41,115],"search":[2,20,33,42,116],"systems":[3],"operate":[4],"on":[5],"automatic":[6],"speech":[7],"recognition":[8],"(ASR)":[9],"outputs,":[10],"which":[11,44],"causes":[12],"them":[13],"to":[14,25,30],"have":[15],"a":[16,38,62,75,111],"complex":[17],"indexing":[18],"and":[19,52,57,69,87,106,121,136],"pipeline.":[21],"This":[22],"has":[23],"led":[24],"interest":[26],"in":[27,142],"ASR-free":[28,40],"approaches":[29],"simplify":[31],"the":[32,70,91,97,103,126,130,143],"procedure.":[34],"We":[35],"recently":[36],"proposed":[37,98,127],"neural":[39,66],"model":[43,104,128],"achieves":[45],"competitive":[46],"performance":[47,105],"while":[48],"maintaining":[49],"an":[50],"efficient":[51],"simplified":[53],"pipeline,":[54],"where":[55],"queries":[56,120,122,135,137],"documents":[58],"are":[59,72],"encoded":[60],"with":[61,74,84],"pair":[63],"of":[64,90],"recurrent":[65],"network":[67],"encoders":[68],"encodings":[71],"combined":[73],"dot-product.":[76],"In":[77],"this":[78,82],"paper,":[79],"we":[80],"extend":[81],"work":[83],"multilingual":[85,99],"pretraining":[86],"detailed":[88],"analysis":[89],"model.":[92],"Our":[93],"experiments":[94],"show":[95],"that":[96,107,138],"training":[100,144],"significantly":[101],"improves":[102],"despite":[108],"not":[109,140],"matching":[110],"strong":[112],"ASR-based":[113,131],"conventional":[114],"system":[117,132],"for":[118,133],"short":[119],"comprising":[123],"in-vocabulary":[124],"words,":[125],"outperforms":[129],"long":[134],"do":[139],"appear":[141],"data.":[145]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-05-23T08:51:43.019350","created_date":"2025-10-10T00:00:00"}
