{"id":"https://openalex.org/W4402112325","doi":"https://doi.org/10.21437/interspeech.2024-2457","title":"Beam-search SIEVE for low-memory speech recognition","display_name":"Beam-search SIEVE for low-memory speech recognition","publication_year":2024,"publication_date":"2024-09-01","ids":{"openalex":"https://openalex.org/W4402112325","doi":"https://doi.org/10.21437/interspeech.2024-2457"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2024-2457","is_oa":false,"landing_page_url":"http://dx.doi.org/10.21437/interspeech.2024-2457","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2024","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://researchprofiles.ku.dk/da/publications/156cb9a9-01b9-4e94-83b9-de10f68ddef7","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054507372","display_name":"Martino Ciaperoni","orcid":"https://orcid.org/0009-0009-7581-2031"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Martino Ciaperoni","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003869083","display_name":"Athanasios Katsamanis","orcid":"https://orcid.org/0000-0002-2642-2354"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Athanasios Katsamanis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022164041","display_name":"Aristides Gionis","orcid":"https://orcid.org/0000-0002-5211-112X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aristides Gionis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5103092057","display_name":"Panagiotis Karras","orcid":"https://orcid.org/0000-0003-0509-9129"},"institutions":[{"id":"https://openalex.org/I4210137115","display_name":"Data & Society Research Institute","ror":"https://ror.org/04dse4f93","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210137115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Panagiotis Karras","raw_affiliation_strings":["K\u00f8benhavns Universitet, Faculty of Science, Department of Computer Science, Software, Data, People & Society, DK"],"affiliations":[{"raw_affiliation_string":"K\u00f8benhavns Universitet, Faculty of Science, Department of Computer Science, Software, Data, People & Society, DK","institution_ids":["https://openalex.org/I4210137115"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5054507372"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12276474,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"272","last_page":"276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11609","display_name":"Geophysical Methods and Applications","score":0.9839000105857849,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7748766541481018},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7453545331954956},{"id":"https://openalex.org/keywords/beam-search","display_name":"Beam search","score":0.6503443121910095},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5776347517967224},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5548132061958313},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.42646947503089905},{"id":"https://openalex.org/keywords/sieve","display_name":"Sieve (category theory)","score":0.42026659846305847},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.39883121848106384},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.37744051218032837},{"id":"https://openalex.org/keywords/search-algorithm","display_name":"Search algorithm","score":0.37631577253341675},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3221970796585083},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3181542754173279},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.21058803796768188},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1547640562057495}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7748766541481018},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7453545331954956},{"id":"https://openalex.org/C19889080","wikidata":"https://www.wikidata.org/wiki/Q2835852","display_name":"Beam search","level":3,"score":0.6503443121910095},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5776347517967224},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5548132061958313},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.42646947503089905},{"id":"https://openalex.org/C17732976","wikidata":"https://www.wikidata.org/wiki/Q7511782","display_name":"Sieve (category theory)","level":2,"score":0.42026659846305847},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.39883121848106384},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.37744051218032837},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.37631577253341675},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3221970796585083},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3181542754173279},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.21058803796768188},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1547640562057495},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2024-2457","is_oa":false,"landing_page_url":"http://dx.doi.org/10.21437/interspeech.2024-2457","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2024","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/156cb9a9-01b9-4e94-83b9-de10f68ddef7","is_oa":true,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/156cb9a9-01b9-4e94-83b9-de10f68ddef7","pdf_url":null,"source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Ciaperoni , M , Katsamanis , A , Gionis , A & Karras , P 2024 , Beam-search SIEVE for low-memory speech recognition . in Interspeech 2024 - Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH . International Speech Communication Association (ISCA) , pp. 272-276 , 25th Interspeech Conferece 2024 , Kos Island , Greece , 01/09/2024 . https://doi.org/10.21437/Interspeech.2024-2457","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/156cb9a9-01b9-4e94-83b9-de10f68ddef7","is_oa":true,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/156cb9a9-01b9-4e94-83b9-de10f68ddef7","pdf_url":null,"source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Ciaperoni , M , Katsamanis , A , Gionis , A & Karras , P 2024 , Beam-search SIEVE for low-memory speech recognition . in Interspeech 2024 - Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH . International Speech Communication Association (ISCA) , pp. 272-276 , 25th Interspeech Conferece 2024 , Kos Island , Greece , 01/09/2024 . https://doi.org/10.21437/Interspeech.2024-2457","raw_type":"contributionToPeriodical"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","score":0.4099999964237213,"display_name":"Gender equality"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2891987081","https://openalex.org/W4386269615","https://openalex.org/W4390091683","https://openalex.org/W1994919150","https://openalex.org/W58921990","https://openalex.org/W2204575588","https://openalex.org/W2081821176","https://openalex.org/W2159879965","https://openalex.org/W3084994579","https://openalex.org/W2998661990"],"abstract_inverted_index":{"A":[0,73],"capacity":[1],"to":[2,18,133,138],"recognize":[3],"speech":[4,24],"offline":[5],"eliminates":[6,81],"privacy":[7],"concerns":[8],"and":[9,31,121,136,144],"the":[10,20,48,56,77,82,114],"need":[11],"for":[12],"an":[13],"internet":[14],"connection.":[15],"Despite":[16],"efforts":[17],"reduce":[19],"memory":[21,60,126,139],"demands":[22,28],"of":[23,53,76,103,117],"recognition":[25],"systems,":[26],"these":[27],"remain":[29],"formidable":[30],"thus":[32],"popular":[33],"tools":[34],"such":[35,54],"as":[36],"Kaldi":[37],"run":[38],"best":[39],"via":[40,70,110],"cloud":[41],"computing.":[42],"The":[43],"key":[44],"bottleneck":[45],"arises":[46],"form":[47],"fact":[49],"that":[50,61,105],"a":[51,91,101],"bedrock":[52],"tools,":[55],"Viterbi":[57,78],"algorithm,":[58,79],"requires":[59],"grows":[62],"linearly":[63,124],"with":[64,90],"utterance":[65],"length":[66,84],"even":[67],"when":[68],"contained":[69],"beam":[71,111,119],"search.":[72],"recent":[74],"recasting":[75],"SIEVE,":[80],"path":[83],"factor":[85],"from":[86],"space":[87],"complexity,":[88],"but":[89],"significant":[92],"practical":[93],"runtime":[94,108],"overhead.":[95],"In":[96],"this":[97,107],"paper,":[98],"we":[99],"develop":[100],"variant":[102],"SIEVE":[104],"lessens":[106],"overhead":[109],"search,":[112,120],"retains":[113],"decoding":[115,134],"quality":[116,135],"standard":[118],"waives":[122],"its":[123],"growing":[125],"bottleneck.":[127],"This":[128],"space-complexity":[129],"reduction":[130],"is":[131],"orthogonal":[132],"complementary":[137],"savings":[140],"in":[141],"model":[142],"representation":[143],"training.":[145]},"counts_by_year":[],"updated_date":"2026-03-21T08:13:44.787528","created_date":"2025-10-10T00:00:00"}
