{"id":"https://openalex.org/W4392903952","doi":"https://doi.org/10.1109/icassp48485.2024.10447812","title":"Sensi-Bert: Towards Sensitivity Driven Fine-Tuning for Parameter-Efficient Language Model","display_name":"Sensi-Bert: Towards Sensitivity Driven Fine-Tuning for Parameter-Efficient Language Model","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392903952","doi":"https://doi.org/10.1109/icassp48485.2024.10447812"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10447812","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447812","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087095284","display_name":"Souvik Kundu","orcid":"https://orcid.org/0000-0001-5815-8765"},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Souvik Kundu","raw_affiliation_strings":["Intel Labs,San Diego,USA","Intel Labs, San Diego, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs,San Diego,USA","institution_ids":["https://openalex.org/I1343180700"]},{"raw_affiliation_string":"Intel Labs, San Diego, USA","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101153316","display_name":"Sharath Nittur Sridhar","orcid":null},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sharath Nittur Sridhar","raw_affiliation_strings":["Intel Labs,San Diego,USA","Intel Labs, San Diego, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs,San Diego,USA","institution_ids":["https://openalex.org/I1343180700"]},{"raw_affiliation_string":"Intel Labs, San Diego, USA","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059919489","display_name":"Maciej Szankin","orcid":"https://orcid.org/0000-0002-2544-1393"},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maciej Szankin","raw_affiliation_strings":["Intel Labs,San Diego,USA","Intel Labs, San Diego, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs,San Diego,USA","institution_ids":["https://openalex.org/I1343180700"]},{"raw_affiliation_string":"Intel Labs, San Diego, USA","institution_ids":["https://openalex.org/I1343180700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013199442","display_name":"Sairam Sundaresan","orcid":"https://orcid.org/0000-0002-6648-0591"},"institutions":[{"id":"https://openalex.org/I1343180700","display_name":"Intel (United States)","ror":"https://ror.org/01ek73717","country_code":"US","type":"company","lineage":["https://openalex.org/I1343180700"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sairam Sundaresan","raw_affiliation_strings":["Intel Labs,San Diego,USA","Intel Labs, San Diego, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Labs,San Diego,USA","institution_ids":["https://openalex.org/I1343180700"]},{"raw_affiliation_string":"Intel Labs, San Diego, USA","institution_ids":["https://openalex.org/I1343180700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60000943,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"10071","last_page":"10075"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7682722210884094},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.766607403755188},{"id":"https://openalex.org/keywords/sensitivity","display_name":"Sensitivity (control systems)","score":0.5975707173347473},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.5146487951278687},{"id":"https://openalex.org/keywords/fine-tuning","display_name":"Fine-tuning","score":0.4932515025138855},{"id":"https://openalex.org/keywords/model-parameter","display_name":"Model parameter","score":0.4522380232810974},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.4159954786300659},{"id":"https://openalex.org/keywords/reservation","display_name":"Reservation","score":0.41490256786346436},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3430139422416687},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.19060629606246948}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7682722210884094},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.766607403755188},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.5975707173347473},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.5146487951278687},{"id":"https://openalex.org/C157524613","wikidata":"https://www.wikidata.org/wiki/Q2828883","display_name":"Fine-tuning","level":2,"score":0.4932515025138855},{"id":"https://openalex.org/C2983447341","wikidata":"https://www.wikidata.org/wiki/Q1413083","display_name":"Model parameter","level":2,"score":0.4522380232810974},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.4159954786300659},{"id":"https://openalex.org/C2777632111","wikidata":"https://www.wikidata.org/wiki/Q1937518","display_name":"Reservation","level":2,"score":0.41490256786346436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3430139422416687},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.19060629606246948},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10447812","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447812","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W2896457183","https://openalex.org/W2923014074","https://openalex.org/W2962818002","https://openalex.org/W2963748441","https://openalex.org/W2963846996","https://openalex.org/W2965373594","https://openalex.org/W2970454332","https://openalex.org/W2975429091","https://openalex.org/W2978017171","https://openalex.org/W2978670439","https://openalex.org/W2996428491","https://openalex.org/W3015233032","https://openalex.org/W3034457371","https://openalex.org/W3095319910","https://openalex.org/W3101248447","https://openalex.org/W3104263050","https://openalex.org/W3105966348","https://openalex.org/W3167266074","https://openalex.org/W3177265267","https://openalex.org/W3214153155","https://openalex.org/W4205807230","https://openalex.org/W4226073878","https://openalex.org/W4245958820","https://openalex.org/W4280575426","https://openalex.org/W4287777801","https://openalex.org/W4384918448","https://openalex.org/W4385573119","https://openalex.org/W4385805166","https://openalex.org/W4386185625","https://openalex.org/W6605323724","https://openalex.org/W6691459498","https://openalex.org/W6737236263","https://openalex.org/W6750615492","https://openalex.org/W6755207826","https://openalex.org/W6766673545","https://openalex.org/W6767719158","https://openalex.org/W6768021236","https://openalex.org/W6768086466","https://openalex.org/W6768851824","https://openalex.org/W6776129198","https://openalex.org/W6777017071","https://openalex.org/W6780482815","https://openalex.org/W6803882846","https://openalex.org/W6810893473","https://openalex.org/W6849467956","https://openalex.org/W6854866820"],"related_works":["https://openalex.org/W4315697128","https://openalex.org/W3102845713","https://openalex.org/W2971502891","https://openalex.org/W3205506801","https://openalex.org/W4280599700","https://openalex.org/W3023285645","https://openalex.org/W3037551068","https://openalex.org/W3023594376","https://openalex.org/W4287802662","https://openalex.org/W4309877123"],"abstract_inverted_index":{"Large":[0],"pre-trained":[1,90],"language":[2],"models":[3,49,65,84,97],"have":[4],"recently":[5],"gained":[6],"significant":[7],"traction":[8],"due":[9],"to":[10,66,107,117,160],"their":[11,31,37],"improved":[12],"performance":[13,69,152],"on":[14,39,52,61],"various":[15,161],"down-stream":[16],"tasks":[17,140],"like":[18],"text":[19],"classification":[20],"and":[21,55,93,148],"question":[22],"answering,":[23],"requiring":[24],"only":[25],"few":[26],"epochs":[27],"of":[28,45,82,135],"fine-tuning.":[29,56],"However,":[30],"large":[32],"model":[33,92],"sizes":[34],"often":[35,59],"prohibit":[36],"applications":[38],"resource-constrained":[40],"edge":[41],"devices.":[42],"Existing":[43],"solutions":[44],"yielding":[46],"parameter-efficient":[47,96],"BERT":[48,83,91],"largely":[50],"rely":[51,60],"compute-exhaustive":[53],"training":[54],"Moreover,":[57],"they":[58],"additional":[62],"compute":[63],"heavy":[64],"mitigate":[67],"the":[68,133],"gap.":[70],"In":[71,101],"this":[72],"paper,":[73],"we":[74,103],"present":[75],"Sensi-BERT,":[76],"a":[77,124],"sensitivity":[78,105],"driven":[79],"efficient":[80],"fine-tuning":[81,122],"that":[85,113],"can":[86],"take":[87],"an":[88],"off-the-shelf":[89],"yield":[94],"highly":[95],"for":[98,123],"downstream":[99,139],"tasks.":[100],"specific,":[102],"perform":[104],"analysis":[106],"rank":[108],"each":[109],"individual":[110],"parameter":[111,126,157],"tensor,":[112],"then":[114],"is":[115],"used":[116],"trim":[118],"them":[119],"accordingly":[120],"during":[121],"given":[125],"or":[127,155],"FLOPs":[128],"budget.":[129],"Our":[130],"experiments":[131],"show":[132],"efficacy":[134],"Sensi-BERT":[136],"across":[137],"different":[138],"including":[141],"MNLI,":[142],"QQP,":[143],"QNLI,":[144],"SST-2,":[145],"MRPC,":[146],"CoLA,":[147],"SQuAD,":[149],"showing":[150],"better":[151],"at":[153],"similar":[154],"smaller":[156],"budget":[158],"compared":[159],"alternatives.":[162]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
