{"id":"https://openalex.org/W4405419027","doi":"https://doi.org/10.48550/arxiv.2408.11799","title":"Practical token pruning for foundation models in few-shot conversational virtual assistant systems","display_name":"Practical token pruning for foundation models in few-shot conversational virtual assistant systems","publication_year":2024,"publication_date":"2024-08-21","ids":{"openalex":"https://openalex.org/W4405419027","doi":"https://doi.org/10.48550/arxiv.2408.11799"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2408.11799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.11799","pdf_url":"https://arxiv.org/pdf/2408.11799","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2408.11799","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008247625","display_name":"Haode Qi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qi, Haode","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100966459","display_name":"Cheng Qian","orcid":"https://orcid.org/0000-0001-9913-820X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102724821","display_name":"Jian Ni","orcid":"https://orcid.org/0000-0002-9307-4783"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ni, Jian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037122155","display_name":"Pratyush Singh","orcid":"https://orcid.org/0000-0002-1818-9724"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Pratyush","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069042586","display_name":"Reza Fazeli","orcid":"https://orcid.org/0000-0002-0322-5235"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fazeli, Reza","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091186428","display_name":"Gengyu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Gengyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052478171","display_name":"Zhenqiu Shu","orcid":"https://orcid.org/0009-0007-7972-1300"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shu, Zhongzheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099137290","display_name":"Eric Wayne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wayne, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5012628002","display_name":"Juergen Bross","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bross, Juergen","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5008247625"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9666000008583069,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.8249666690826416},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.743408739566803},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.6900599598884583},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.6761057376861572},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.619337260723114},{"id":"https://openalex.org/keywords/one-shot","display_name":"One shot","score":0.5082723498344421},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40008583664894104},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35694625973701477},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.30192816257476807},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23420238494873047},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.10544589161872864}],"concepts":[{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.8249666690826416},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.743408739566803},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.6900599598884583},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.6761057376861572},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.619337260723114},{"id":"https://openalex.org/C2992734406","wikidata":"https://www.wikidata.org/wiki/Q413267","display_name":"One shot","level":2,"score":0.5082723498344421},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40008583664894104},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35694625973701477},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.30192816257476807},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23420238494873047},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.10544589161872864},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2408.11799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.11799","pdf_url":"https://arxiv.org/pdf/2408.11799","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2408.11799","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2408.11799","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2408.11799","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.11799","pdf_url":"https://arxiv.org/pdf/2408.11799","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4405419027.pdf","grobid_xml":"https://content.openalex.org/works/W4405419027.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2497720472","https://openalex.org/W4292659306","https://openalex.org/W3044321615","https://openalex.org/W2806221744","https://openalex.org/W2326937258","https://openalex.org/W394267150","https://openalex.org/W2773965352","https://openalex.org/W4294892107","https://openalex.org/W2357748469","https://openalex.org/W2392917037"],"abstract_inverted_index":{"In":[0],"an":[1],"enterprise":[2],"Virtual":[3],"Assistant":[4],"(VA)":[5],"system,":[6],"intent":[7,79,100,153],"classification":[8,80,101],"is":[9,19,30],"the":[10,24,70,73,85,111,121,125,147,161],"crucial":[11],"component":[12],"that":[13,141,157],"determines":[14],"how":[15],"a":[16,34,50,58,64,107,136],"user":[17,25,117],"input":[18],"handled":[20],"based":[21],"on":[22,98],"what":[23],"wants.":[26],"The":[27],"VA":[28],"system":[29],"expected":[31],"to":[32,120],"be":[33],"cost-efficient":[35],"SaaS":[36],"service":[37],"with":[38,49,63],"low":[39],"training":[40,54,78,151],"and":[41,68,91],"inference":[42,112,162],"time":[43],"while":[44],"achieving":[45],"high":[46],"accuracy":[47],"even":[48],"small":[51],"number":[52],"of":[53,72,124,131,164],"samples.":[55],"We":[56,155],"pretrain":[57],"transformer-based":[59,108],"sentence":[60,166],"embedding":[61,71],"model":[62,74,109,132,171],"contrastive":[65],"learning":[66],"objective":[67],"leverage":[69],"as":[75],"features":[76,105],"when":[77],"models.":[81],"Our":[82],"approach":[83,140,159],"achieves":[84],"state-of-the-art":[86],"results":[87],"for":[88,115,149,152],"few-shot":[89],"scenarios":[90],"performs":[92],"better":[93],"than":[94],"other":[95],"commercial":[96],"solutions":[97],"popular":[99,165],"benchmarks.":[102],"However,":[103],"generating":[104],"via":[106],"increases":[110],"time,":[113],"especially":[114],"longer":[116],"inputs,":[118],"due":[119],"quadratic":[122],"runtime":[123],"transformer's":[126],"attention":[127],"mechanism.":[128],"On":[129],"top":[130],"distillation,":[133],"we":[134],"introduce":[135],"practical":[137],"multi-task":[138],"adaptation":[139],"configures":[142],"dynamic":[143],"token":[144],"pruning":[145],"without":[146,169],"need":[148],"task-specific":[150],"classification.":[154],"demonstrate":[156],"this":[158],"improves":[160],"speed":[163],"transformer":[167],"models":[168],"affecting":[170],"performance.":[172]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
