{"id":"https://openalex.org/W4408345898","doi":"https://doi.org/10.1109/icassp49660.2025.10890609","title":"Text-Aware Adapter for Few-Shot Keyword Spotting","display_name":"Text-Aware Adapter for Few-Shot Keyword Spotting","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408345898","doi":"https://doi.org/10.1109/icassp49660.2025.10890609"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890609","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890609","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101457226","display_name":"Youngmoon Jung","orcid":"https://orcid.org/0000-0002-4321-379X"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Youngmoon Jung","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100420795","display_name":"Jin-Young Lee","orcid":"https://orcid.org/0000-0002-2920-6411"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jinyoung Lee","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101690593","display_name":"Seung\u2010Jin Lee","orcid":"https://orcid.org/0000-0001-7109-6423"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seungjin Lee","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070542048","display_name":"Myunghun Jung","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Myunghun Jung","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030203043","display_name":"Yong-Hyeok Lee","orcid":"https://orcid.org/0000-0002-2972-9474"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yong-Hyeok Lee","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052468556","display_name":"Hoon Young Cho","orcid":"https://orcid.org/0000-0002-6850-6580"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hoon-Young Cho","raw_affiliation_strings":["AI Solution Team, Samsung Research,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"AI Solution Team, Samsung Research,Seoul,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101457226"],"corresponding_institution_ids":["https://openalex.org/I2250650973"],"apc_list":null,"apc_paid":null,"fwci":4.3637,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.9336229,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/keyword-spotting","display_name":"Keyword spotting","score":0.804991602897644},{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.7786943912506104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7312036752700806},{"id":"https://openalex.org/keywords/spotting","display_name":"Spotting","score":0.7130140066146851},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.5505528450012207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3834327459335327},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.12747642397880554}],"concepts":[{"id":"https://openalex.org/C2781213101","wikidata":"https://www.wikidata.org/wiki/Q6398558","display_name":"Keyword spotting","level":2,"score":0.804991602897644},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.7786943912506104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7312036752700806},{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.7130140066146851},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.5505528450012207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3834327459335327},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.12747642397880554},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890609","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890609","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1496120315","https://openalex.org/W2034940213","https://openalex.org/W2407023693","https://openalex.org/W2603777577","https://openalex.org/W2696967604","https://openalex.org/W2752782242","https://openalex.org/W2928165649","https://openalex.org/W2964187693","https://openalex.org/W2964271799","https://openalex.org/W3024869864","https://openalex.org/W3095180122","https://openalex.org/W3095694146","https://openalex.org/W3095706145","https://openalex.org/W3099793224","https://openalex.org/W3144247233","https://openalex.org/W3162273446","https://openalex.org/W3197564965","https://openalex.org/W4296069322","https://openalex.org/W4319862287","https://openalex.org/W4372260220","https://openalex.org/W4372267453","https://openalex.org/W4372271885","https://openalex.org/W4385822437","https://openalex.org/W4385823146","https://openalex.org/W4385823483","https://openalex.org/W4392904395","https://openalex.org/W4402111546","https://openalex.org/W4402111963","https://openalex.org/W4402112069","https://openalex.org/W4402112278","https://openalex.org/W6688816777","https://openalex.org/W6731763572","https://openalex.org/W6738045163","https://openalex.org/W6750665317"],"related_works":["https://openalex.org/W2918559346","https://openalex.org/W2114097550","https://openalex.org/W4286904253","https://openalex.org/W3119978414","https://openalex.org/W2516975559","https://openalex.org/W3206647229","https://openalex.org/W1969408022","https://openalex.org/W2000885660","https://openalex.org/W2545741539","https://openalex.org/W1989658893"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,27,145],"flexible":[3,51],"keyword":[4,29],"spotting":[5],"(KWS)":[6],"with":[7,57,140],"text":[8,71,76],"enrollment":[9],"allow":[10],"users":[11],"to":[12,47,73,115],"personalize":[13],"keywords":[14,56,132],"without":[15],"uttering":[16],"them":[17],"during":[18],"enrollment.":[19],"However,":[20],"there":[21],"is":[22],"still":[23],"room":[24],"for":[25,54,84,108],"improvement":[26],"target":[28],"performance.":[30],"In":[31,120],"this":[32],"work,":[33],"we":[34,66],"propose":[35],"a":[36,49,68,75,81,90,112,142],"novel":[37],"few-shot":[38,109],"transfer":[39],"learning":[40],"method,":[41],"called":[42],"text-aware":[43],"adapter":[44],"(TA-adapter),":[45],"designed":[46],"enhance":[48],"pre-trained":[50,70,118],"KWS":[52],"model":[53],"specific":[55],"limited":[58],"speech":[59],"samples.":[60],"To":[61],"adapt":[62],"the":[63,85,94,98,103,116,123,134,146],"acoustic":[64],"encoder,":[65],"leverage":[67],"jointly":[69],"encoder":[72],"generate":[74],"embedding":[77],"that":[78],"acts":[79],"as":[80],"representative":[82],"vector":[83],"keyword.":[86],"By":[87],"fine-tuning":[88],"only":[89,141],"small":[91],"portion":[92],"of":[93,149],"network":[95],"while":[96],"keeping":[97],"core":[99],"components\u2019":[100],"weights":[101],"intact,":[102],"TA-adapter":[104,124],"proves":[105],"highly":[106],"efficient":[107],"KWS,":[110],"enabling":[111],"seamless":[113],"return":[114],"original":[117],"model.":[119],"our":[121],"experiments,":[122],"demonstrated":[125],"significant":[126],"performance":[127],"improvements":[128],"across":[129],"35":[130],"distinct":[131],"from":[133],"Google":[135],"Speech":[136],"Commands":[137],"V2":[138],"dataset,":[139],"0.14%":[143],"increase":[144],"total":[147],"number":[148],"parameters.":[150]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
