{"id":"https://openalex.org/W4414693378","doi":"https://doi.org/10.1109/tpami.2025.3616318","title":"DTL: Parameter- and Memory-Efficient Disentangled Vision Learning","display_name":"DTL: Parameter- and Memory-Efficient Disentangled Vision Learning","publication_year":2025,"publication_date":"2025-10-01","ids":{"openalex":"https://openalex.org/W4414693378","doi":"https://doi.org/10.1109/tpami.2025.3616318","pmid":"https://pubmed.ncbi.nlm.nih.gov/41032539"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3616318","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3616318","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020218182","display_name":"Minghao Fu","orcid":"https://orcid.org/0000-0002-4685-6600"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Minghao Fu","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","National Key Laboratory for Novel Software Technology, Nanjing University, China"],"raw_orcid":"https://orcid.org/0000-0002-4685-6600","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ke Zhu","orcid":"https://orcid.org/0009-0007-6338-4151"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Zhu","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","National Key Laboratory for Novel Software Technology, Nanjing University, China"],"raw_orcid":"https://orcid.org/0009-0007-6338-4151","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zonghao Ding","orcid":"https://orcid.org/0009-0009-1933-1428"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zonghao Ding","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","National Key Laboratory for Novel Software Technology, Nanjing University, China"],"raw_orcid":"https://orcid.org/0009-0009-1933-1428","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090881698","display_name":"Jianxin Wu","orcid":"https://orcid.org/0000-0002-2085-7568"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianxin Wu","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","National Key Laboratory for Novel Software Technology, Nanjing University, China"],"raw_orcid":"https://orcid.org/0000-0002-2085-7568","affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology and School of Artificial Intelligence, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020218182"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13582084,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"48","issue":"2","first_page":"1736","last_page":"1749"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9693999886512756,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9641000032424927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.7767000198364258},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.5706999897956848},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5647000074386597},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5552999973297119},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5307999849319458},{"id":"https://openalex.org/keywords/memory-footprint","display_name":"Memory footprint","score":0.5110999941825867},{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.4717999994754791},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.4390999972820282},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4334999918937683}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8562999963760376},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.7767000198364258},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6930999755859375},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.5706999897956848},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5647000074386597},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5552999973297119},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5307999849319458},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.5110999941825867},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.4717999994754791},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44020000100135803},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4390999972820282},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4334999918937683},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.4138999879360199},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.4025999903678894},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C88796919","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Backbone network","level":2,"score":0.37040001153945923},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3443000018596649},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31859999895095825},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3131999969482422},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.2567000091075897},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C2781195486","wikidata":"https://www.wikidata.org/wiki/Q289436","display_name":"Texture (cosmology)","level":3,"score":0.25049999356269836}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3616318","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3616318","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41032539","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41032539","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4824364784","display_name":null,"funder_award_id":"62276123","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G528746023","display_name":null,"funder_award_id":"61921006","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2037227137","https://openalex.org/W2108598243","https://openalex.org/W2165698076","https://openalex.org/W2194775991","https://openalex.org/W2531409750","https://openalex.org/W2737258237","https://openalex.org/W3138516171","https://openalex.org/W3176828726","https://openalex.org/W4225410153","https://openalex.org/W4312310776","https://openalex.org/W4312651322","https://openalex.org/W4313156423","https://openalex.org/W4313175608","https://openalex.org/W4382463911","https://openalex.org/W4385245566","https://openalex.org/W4385573520","https://openalex.org/W4386065763","https://openalex.org/W4386072470","https://openalex.org/W4386083036","https://openalex.org/W4386415485","https://openalex.org/W4386790226","https://openalex.org/W4390872773","https://openalex.org/W4390873054","https://openalex.org/W4390873881","https://openalex.org/W4390874497","https://openalex.org/W4393148714","https://openalex.org/W4393159845","https://openalex.org/W4400580599","https://openalex.org/W4401109685","https://openalex.org/W4402754189","https://openalex.org/W4402916137","https://openalex.org/W4403488721","https://openalex.org/W4403791725","https://openalex.org/W4413146904","https://openalex.org/W4413979290"],"related_works":[],"abstract_inverted_index":{"The":[0],"cost":[1,25],"of":[2,32,68,160,169],"finetuning":[3],"a":[4,29,66,97,109,150,166,183],"pretrained":[5],"model":[6],"on":[7],"downstream":[8,130],"tasks":[9,140],"steadily":[10],"increases":[11],"as":[12,142],"they":[13],"grow":[14],"larger.":[15],"Parameter-efficient":[16],"transfer":[17,127],"learning":[18],"(PETL)":[19],"is":[20,42],"proposed":[21],"to":[22,72,120,137],"reduce":[23],"this":[24,80],"by":[26,148,182],"changing":[27],"only":[28,164],"tiny":[30],"subset":[31],"trainable":[33,52,91,174],"parameters.":[34],"But,":[35],"the":[36,62,90,94,117,121,158],"GPU":[37,170],"memory":[38,171],"footprint":[39],"during":[40],"training":[41],"not":[43,163],"effectively":[44,124],"reduced":[45],"in":[46,128,186],"PETL.":[47],"This":[48],"issue":[49],"happens":[50],"because":[51],"parameters":[53,92],"from":[54,93],"these":[55],"methods":[56,181],"are":[57],"generally":[58],"tightly":[59],"entangled":[60],"with":[61,108],"backbone,":[63,122],"such":[64,141],"that":[65],"lot":[67],"intermediate":[69],"states":[70],"have":[71],"be":[73],"stored":[74],"for":[75],"back":[76,119],"propagation.":[77],"To":[78],"alleviate":[79],"issue,":[81],"we":[82],"introduce":[83],"Disentangled":[84],"Transfer":[85],"Learning":[86],"(DTL),":[87],"which":[88,162],"disentangles":[89],"backbone":[95],"using":[96],"lightweight":[98],"Compact":[99],"Side":[100],"Network":[101],"(CSN).":[102],"By":[103],"progressively":[104],"extracting":[105],"task-specific":[106],"information":[107,118],"few":[110],"low-rank":[111],"linear":[112],"mappings":[113],"and":[114,145,173],"appropriately":[115],"adding":[116],"CSN":[123],"realizes":[125],"knowledge":[126],"various":[129],"recognition":[131],"tasks.":[132],"We":[133],"further":[134],"extend":[135],"DTL":[136],"more":[138,151],"difficult":[139],"object":[143],"detection":[144],"semantic":[146],"segmentation":[147],"employing":[149],"sparse":[152],"architectural":[153],"design.":[154],"Extensive":[155],"experiments":[156],"validate":[157],"effectiveness":[159],"DTL,":[161],"reduces":[165],"large":[167],"amount":[168],"usage":[172],"parameters,":[175],"but":[176],"also":[177],"outperforms":[178],"existing":[179],"PETL":[180],"significant":[184],"margin":[185],"accuracy.":[187]},"counts_by_year":[],"updated_date":"2026-01-11T23:08:45.486102","created_date":"2025-10-10T00:00:00"}
