{"id":"https://openalex.org/W4411553033","doi":"https://doi.org/10.1145/3733566.3734432","title":"TOU: A Truncated-factorized reduction for a lightweight fine-tuning method","display_name":"TOU: A Truncated-factorized reduction for a lightweight fine-tuning method","publication_year":2025,"publication_date":"2025-06-23","ids":{"openalex":"https://openalex.org/W4411553033","doi":"https://doi.org/10.1145/3733566.3734432"},"language":"en","primary_location":{"id":"doi:10.1145/3733566.3734432","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733566.3734432","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th Workshop on Intelligent Cross-Data Analysis and Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3733566.3734432","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055365497","display_name":"Phuc Binh Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Phuong Thi-Mai Nguyen","raw_affiliation_strings":["Big Data Integration Center National Institute of Information and Communications Technology, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0009-0006-8970-8823","affiliations":[{"raw_affiliation_string":"Big Data Integration Center National Institute of Information and Communications Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I90023481"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048072689","display_name":"Koji Zettsu","orcid":"https://orcid.org/0000-0003-4062-2376"},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Koji Zettsu","raw_affiliation_strings":["Big Data Integration Center National Institute of Information and Communications Technology, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0000-0003-4062-2376","affiliations":[{"raw_affiliation_string":"Big Data Integration Center National Institute of Information and Communications Technology, Tokyo, Japan","institution_ids":["https://openalex.org/I90023481"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5055365497"],"corresponding_institution_ids":["https://openalex.org/I90023481"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06786164,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"38","last_page":"45"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9470999836921692,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.7697805166244507},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6616541147232056},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.41392242908477783},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.37150442600250244},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21071887016296387},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.05641987919807434}],"concepts":[{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.7697805166244507},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6616541147232056},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41392242908477783},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.37150442600250244},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21071887016296387},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.05641987919807434}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3733566.3734432","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733566.3734432","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th Workshop on Intelligent Cross-Data Analysis and Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3733566.3734432","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3733566.3734432","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th Workshop on Intelligent Cross-Data Analysis and Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2066043610","https://openalex.org/W2612690371","https://openalex.org/W2754084392","https://openalex.org/W2914304175","https://openalex.org/W2963026768","https://openalex.org/W2963912046","https://openalex.org/W2990138404","https://openalex.org/W3034238904","https://openalex.org/W3035646933","https://openalex.org/W3099793224","https://openalex.org/W3169483174","https://openalex.org/W3174770825","https://openalex.org/W3176828726","https://openalex.org/W4205991051","https://openalex.org/W4283809320","https://openalex.org/W4307044600"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2352590024"],"abstract_inverted_index":{"The":[0],"full":[1,99,166,183,224],"fine-tuning":[2,79,138,257],"pre-trained":[3,52],"models":[4,173],"represents":[5],"an":[6],"effective":[7,165],"approach.":[8],"But":[9],"it":[10],"typically":[11],"requires":[12],"the":[13,68,72,83,93,98,105,135,145,187,256,261],"updating":[14,97],"of":[15,92,107,118,171,211,218,236],"all":[16],"model":[17,141,190,258],"parameters,":[18],"which":[19],"can":[20],"result":[21],"in":[22,23,116,148,198,209,216,234,254],"computational":[24,262],"and":[25,120,140,152,164,214,239],"memory":[26,219,240],"costs.":[27],"To":[28],"address":[29],"this":[30],"challenge,":[31],"we":[32,129],"present":[33],"a":[34,40,125,131,159,195],"methodology":[35,41],"called":[36],"Truncated-factorized":[37],"reduction":[38,197],"(TOU),":[39],"that":[42,156,192],"leverages":[43],"Truncated":[44],"Singular":[45],"Value":[46],"Decomposition":[47],"(TSVD)":[48],"to":[49,77,113,133,154,174,181,223,244],"factorize":[50],"each":[51],"weight":[53,85,225],"matrix":[54,90],"into":[55],"two":[56,94],"smaller":[57],"matrices.":[58],"One":[59],"factor":[60,74],"is":[61,75],"strategically":[62],"frozen,":[63],"preserving":[64],"core":[65],"knowledge":[66],"from":[67],"pre-train":[69],"phase,":[70],"while":[71,177,201],"other":[73],"subjected":[76],"standard":[78],"procedures.":[80],"After":[81],"fine-tuning,":[82,111,167],"original":[84],"matrices":[86],"are":[87],"reconstructed":[88],"by":[89,123,143,259],"multiplication":[91],"factors,":[95],"effectively":[96],"weights.":[100],"This":[101,250],"method":[102],"significantly":[103],"reduces":[104,207],"number":[106],"trainable":[108,199],"parameters":[109,200],"during":[110],"leading":[112],"enhanced":[114],"efficiency":[115,127,139],"terms":[117,210,217,235],"computation":[119],"memory.":[121],"Furthermore,":[122,227],"introducing":[124],"novelty":[126],"parameter,":[128],"provide":[130],"mechanism":[132],"control":[134],"trade-off":[136],"between":[137],"adaptability":[142],"adjusting":[144],"truncation":[146],"level":[147],"TSVD.":[149],"We":[150],"hypothesize":[151],"aim":[153],"demonstrate":[155],"TOU":[157,193,228],"offers":[158],"compelling":[160],"strategy":[161],"for":[162],"efficient":[163],"enabling":[168],"faster":[169],"adaptation":[170],"large":[172],"new":[175],"tasks":[176],"maintaining":[178,202],"performance":[179,222,231],"compared":[180],"traditional":[182],"fine-tuning.":[184,226],"Experiments":[185],"on":[186],"Vision":[188],"Transformer":[189],"show":[191],"achieves":[194],"70%":[196],"(accuracy":[203],"drops":[204],"<":[205],"1%),":[206],"65%":[208],"training":[212,237],"time,":[213],"27%":[215],"usage":[220,241],"comparable":[221,248],"delivers":[229],"better":[230],"than":[232],"LoRA":[233],"speed":[238],"when":[242],"applied":[243],"fine-tune":[245],"GPT-2M":[246],"with":[247,265],"performance.":[249],"approach":[251],"holds":[252],"promise":[253],"accelerating":[255],"reducing":[260],"burden":[263],"associated":[264],"their":[266],"downstream":[267],"application.":[268]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
