{"id":"https://openalex.org/W4387848667","doi":"https://doi.org/10.1145/3583780.3614904","title":"Hadamard Adapter: An Extreme Parameter-Efficient Adapter Tuning Method for Pre-trained Language Models","display_name":"Hadamard Adapter: An Extreme Parameter-Efficient Adapter Tuning Method for Pre-trained Language Models","publication_year":2023,"publication_date":"2023-10-21","ids":{"openalex":"https://openalex.org/W4387848667","doi":"https://doi.org/10.1145/3583780.3614904"},"language":"en","primary_location":{"id":"doi:10.1145/3583780.3614904","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3583780.3614904","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060201245","display_name":"Yuyan Chen","orcid":"https://orcid.org/0009-0003-5888-5518"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuyan Chen","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4381-486X","affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086820941","display_name":"Qiang Fu","orcid":"https://orcid.org/0000-0002-5821-7267"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Fu","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5821-7267","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101589508","display_name":"Ge Fan","orcid":"https://orcid.org/0000-0001-5653-1626"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Fan","raw_affiliation_strings":["Tencent, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5653-1626","affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008387608","display_name":"Lun Du","orcid":"https://orcid.org/0000-0002-7625-0650"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lun Du","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7625-0650","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025118710","display_name":"Jian\u2013Guang Lou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian-Guang Lou","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8496-033X","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006300825","display_name":"Shi Han","orcid":"https://orcid.org/0000-0002-0360-6089"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shi Han","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0360-6089","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100331488","display_name":"Dongmei Zhang","orcid":"https://orcid.org/0000-0002-9230-2799"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongmei Zhang","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9230-2799","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065529268","display_name":"Zhixu Li","orcid":"https://orcid.org/0000-0003-2355-288X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixu Li","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-2355-288X","affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090455375","display_name":"Yanghua Xiao","orcid":"https://orcid.org/0000-0001-8403-9591"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanghua Xiao","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University &amp; Fudan-Aishu Cognitive Intelligence Joint Research Center, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-8403-9591","affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University &amp; Fudan-Aishu Cognitive Intelligence Joint Research Center, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5060201245"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":2.3477,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.90867041,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"276","last_page":"285"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9729999899864197,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.9594703912734985},{"id":"https://openalex.org/keywords/hadamard-transform","display_name":"Hadamard transform","score":0.7043105363845825},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6690413951873779},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.34015634655952454},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3328932225704193},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32028084993362427},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.2789970636367798},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16780850291252136}],"concepts":[{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.9594703912734985},{"id":"https://openalex.org/C60292330","wikidata":"https://www.wikidata.org/wiki/Q1014065","display_name":"Hadamard transform","level":2,"score":0.7043105363845825},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6690413951873779},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.34015634655952454},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3328932225704193},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32028084993362427},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2789970636367798},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16780850291252136},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3583780.3614904","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3583780.3614904","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1724438581","https://openalex.org/W1821462560","https://openalex.org/W2134797427","https://openalex.org/W2181101938","https://openalex.org/W2233116163","https://openalex.org/W2560674852","https://openalex.org/W2766839578","https://openalex.org/W2799054028","https://openalex.org/W2896457183","https://openalex.org/W2964217848","https://openalex.org/W2965373594","https://openalex.org/W3033187248","https://openalex.org/W3103616906","https://openalex.org/W3153675281","https://openalex.org/W3168867926","https://openalex.org/W3173788106","https://openalex.org/W3174770825","https://openalex.org/W3176468671","https://openalex.org/W3176828726","https://openalex.org/W3199761064","https://openalex.org/W4205991051","https://openalex.org/W4206178588","https://openalex.org/W4221154357","https://openalex.org/W4225619898","https://openalex.org/W4238846128","https://openalex.org/W4280534475","https://openalex.org/W4286903741","https://openalex.org/W4286981949","https://openalex.org/W4287123286","https://openalex.org/W4287796851","https://openalex.org/W4287824654","https://openalex.org/W4288088047","https://openalex.org/W4288089799","https://openalex.org/W4292779060","https://openalex.org/W4297790889","https://openalex.org/W4297795751","https://openalex.org/W4300081896","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2133028525","https://openalex.org/W4229060448","https://openalex.org/W4306381730","https://openalex.org/W2981692913","https://openalex.org/W3044188621","https://openalex.org/W3184035966","https://openalex.org/W2160602540","https://openalex.org/W2485605994","https://openalex.org/W4385571108","https://openalex.org/W4200251711"],"abstract_inverted_index":{"Recent":[0],"years,":[1],"Pre-trained":[2],"Language":[3],"models":[4],"(PLMs)":[5],"have":[6,26],"swept":[7],"into":[8],"various":[9,124],"fields":[10],"of":[11,30,47,61],"artificial":[12],"intelligence":[13],"and":[14,24,37,40,170],"achieved":[15],"great":[16],"success.":[17],"However,":[18],"most":[19],"PLMs,":[20],"such":[21],"as":[22,99],"T5":[23],"GPT3,":[25],"a":[27,45,55,77],"huge":[28],"amount":[29],"parameters,":[31],"fine-tuning":[32,64],"them":[33,42],"is":[34,51,186],"often":[35],"expensive":[36],"time":[38],"consuming,":[39],"storing":[41],"takes":[43],"up":[44],"lot":[46],"space.":[48],"Therefore,":[49],"it":[50,171],"necessary":[52],"to":[53,58,107,128,199],"adopt":[54],"parameter-efficient":[56,109],"approach":[57],"reduce":[59],"parameters":[60,105,165,175],"PLMs":[62,153],"in":[63,69,86,139,191],"without":[65],"compromising":[66],"their":[67],"performance":[68,161],"downstream":[70,125],"tasks.":[71],"In":[72,111],"this":[73],"paper,":[74],"we":[75,113,181],"design":[76],"novel":[78],"adapter":[79,89,121,158,194],"which":[80,195],"only":[81,163,205],"acts":[82],"on":[83,145],"self-attention":[84],"outputs":[85],"PLMs.":[87],"This":[88],"adopts":[90],"element-wise":[91],"linear":[92],"transformation":[93],"using":[94],"Hadamard":[95,100,120,157,193],"product,":[96],"hence":[97],"named":[98],"adapter,":[101],"requires":[102],"the":[103,146,156,173,192],"fewest":[104,174],"compared":[106,166,176],"previous":[108],"adapters.":[110,179],"addition,":[112],"also":[114,187],"summarize":[115],"some":[116,130,188],"tuning":[117],"patterns":[118],"for":[119,132],"shared":[122,137],"by":[123],"tasks,":[126],"expecting":[127],"provide":[129],"guidance":[131],"further":[133,182],"parameter":[134,202],"reduction":[135],"with":[136,150,162,167,177,204],"adapters":[138],"future":[140],"studies.":[141],"The":[142],"experiments":[143],"conducted":[144],"widely-used":[147],"GLUE":[148],"benchmark":[149],"several":[151],"SOTA":[152],"prove":[154],"that":[155,184],"achieves":[159],"competitive":[160],"0.033%":[164],"full":[168],"fine-tuning,":[169],"has":[172],"other":[178],"Moreover,":[180],"find":[183],"there":[185],"redundant":[189],"layers":[190],"can":[196],"be":[197],"removed":[198],"achieve":[200],"more":[201],"efficiency":[203],"0.022%":[206],"parameters.":[207]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":7}],"updated_date":"2026-05-09T13:55:54.758798","created_date":"2025-10-10T00:00:00"}
