{"id":"https://openalex.org/W4404486469","doi":"https://doi.org/10.1109/jstsp.2024.3501685","title":"DARIO: Differentiable Vision Transformer Pruning With Low-Cost Proxies","display_name":"DARIO: Differentiable Vision Transformer Pruning With Low-Cost Proxies","publication_year":2024,"publication_date":"2024-09-01","ids":{"openalex":"https://openalex.org/W4404486469","doi":"https://doi.org/10.1109/jstsp.2024.3501685"},"language":"en","primary_location":{"id":"doi:10.1109/jstsp.2024.3501685","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2024.3501685","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/10818/63362","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102912726","display_name":"Haozhe Sun","orcid":"https://orcid.org/0009-0000-7202-2223"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210126360","display_name":"Centre Inria de Saclay","ror":"https://ror.org/0315e5x55","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210126360"]},{"id":"https://openalex.org/I4387152856","display_name":"Laboratoire Interdisciplinaire des Sciences du Num\u00e9rique","ror":"https://ror.org/00rd81916","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I277688954","https://openalex.org/I4387152856"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Haozhe Sun","raw_affiliation_strings":["LISN, INRIA, CNRS, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","LISN, INRIA, CNRS, Universite Paris-Saclay, France"],"raw_orcid":"https://orcid.org/0009-0000-7202-2223","affiliations":[{"raw_affiliation_string":"LISN, INRIA, CNRS, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","institution_ids":["https://openalex.org/I4210126360","https://openalex.org/I277688954","https://openalex.org/I1294671590","https://openalex.org/I4387152856"]},{"raw_affiliation_string":"LISN, INRIA, CNRS, Universite Paris-Saclay, France","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I1326498283","https://openalex.org/I1294671590","https://openalex.org/I4387152856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081018738","display_name":"Alexandre Heuillet","orcid":"https://orcid.org/0000-0003-2109-7895"},"institutions":[{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210107733","display_name":"Informatique, BioInformatique, Syst\u00e8mes Complexes","ror":"https://ror.org/01aqxgr98","country_code":"FR","type":"facility","lineage":["https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210107733","https://openalex.org/I88467170"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Alexandre Heuillet","raw_affiliation_strings":["IBISC, Univ Evry, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","IBISC, Univ Evry, Universite Paris-Saclay, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBISC, Univ Evry, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","institution_ids":["https://openalex.org/I4210107733","https://openalex.org/I277688954"]},{"raw_affiliation_string":"IBISC, Univ Evry, Universite Paris-Saclay, France","institution_ids":["https://openalex.org/I4210107733","https://openalex.org/I277688954"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032411139","display_name":"Felix Mohr","orcid":"https://orcid.org/0000-0002-9293-2424"},"institutions":[{"id":"https://openalex.org/I157650460","display_name":"Universidad de La Sabana","ror":"https://ror.org/02sqgkj21","country_code":"CO","type":"education","lineage":["https://openalex.org/I157650460"]}],"countries":["CO"],"is_corresponding":false,"raw_author_name":"Felix Mohr","raw_affiliation_strings":["Universidad de la Sabana, Ch&#x00ED;a, Colombia","Universidad de la Sabana, Ch&#x0131;a, Colombia"],"raw_orcid":"https://orcid.org/0000-0002-9293-2424","affiliations":[{"raw_affiliation_string":"Universidad de la Sabana, Ch&#x00ED;a, Colombia","institution_ids":["https://openalex.org/I157650460"]},{"raw_affiliation_string":"Universidad de la Sabana, Ch&#x0131;a, Colombia","institution_ids":["https://openalex.org/I157650460"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107633038","display_name":"Hedi Tabia","orcid":"https://orcid.org/0000-0002-1827-7150"},"institutions":[{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210107733","display_name":"Informatique, BioInformatique, Syst\u00e8mes Complexes","ror":"https://ror.org/01aqxgr98","country_code":"FR","type":"facility","lineage":["https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210107733","https://openalex.org/I88467170"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Hedi Tabia","raw_affiliation_strings":["IBISC, Univ Evry, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","IBISC, Univ Evry, Universite Paris-Saclay, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBISC, Univ Evry, Universit&#x00E9; Paris-Saclay, Gif-sur-Yvette, France","institution_ids":["https://openalex.org/I4210107733","https://openalex.org/I277688954"]},{"raw_affiliation_string":"IBISC, Univ Evry, Universite Paris-Saclay, France","institution_ids":["https://openalex.org/I4210107733","https://openalex.org/I277688954"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4367,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64093195,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"18","issue":"6","first_page":"997","last_page":"1009"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9731000065803528,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9731000065803528,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9635999798774719,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9623000025749207,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.6569456458091736},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5624881982803345},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5314447283744812},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5310271978378296},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4982123374938965},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4504285454750061},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3295971751213074},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2951759696006775},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12580859661102295},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.0951697826385498}],"concepts":[{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.6569456458091736},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5624881982803345},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5314447283744812},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5310271978378296},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4982123374938965},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4504285454750061},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3295971751213074},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2951759696006775},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12580859661102295},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0951697826385498},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/jstsp.2024.3501685","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2024.3501685","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-04813053v1","is_oa":false,"landing_page_url":"https://univ-evry.hal.science/hal-04813053","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing, 2024, 18 (6), pp.997--1009. &#x27E8;10.1109/JSTSP.2024.3501685&#x27E9;","raw_type":"Journal articles"},{"id":"pmh:oai:intellectum.unisabana.edu.co:10818/63362","is_oa":true,"landing_page_url":"https://hdl.handle.net/10818/63362","pdf_url":null,"source":{"id":"https://openalex.org/S4306401748","display_name":"Intellectum (Universidad de La Sabana)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I157650460","host_organization_name":"Universidad de La Sabana","host_organization_lineage":["https://openalex.org/I157650460"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"}],"best_oa_location":{"id":"pmh:oai:intellectum.unisabana.edu.co:10818/63362","is_oa":true,"landing_page_url":"https://hdl.handle.net/10818/63362","pdf_url":null,"source":{"id":"https://openalex.org/S4306401748","display_name":"Intellectum (Universidad de La Sabana)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I157650460","host_organization_name":"Universidad de La Sabana","host_organization_lineage":["https://openalex.org/I157650460"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320326542","display_name":"Universidad de La Sabana","ror":"https://ror.org/02sqgkj21"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1982825626","https://openalex.org/W2050883661","https://openalex.org/W2117539524","https://openalex.org/W2140132917","https://openalex.org/W2194775991","https://openalex.org/W2922073769","https://openalex.org/W2955051405","https://openalex.org/W2962677625","https://openalex.org/W2962851801","https://openalex.org/W2964081807","https://openalex.org/W2965862774","https://openalex.org/W3083021344","https://openalex.org/W3096727283","https://openalex.org/W3116594510","https://openalex.org/W3154851733","https://openalex.org/W3164008977","https://openalex.org/W3184606595","https://openalex.org/W3193542387","https://openalex.org/W4206281850","https://openalex.org/W4206634569","https://openalex.org/W4226126941","https://openalex.org/W4283811336","https://openalex.org/W4285805347","https://openalex.org/W4313156423","https://openalex.org/W4365446402","https://openalex.org/W4385482786","https://openalex.org/W4385958936","https://openalex.org/W4386065441","https://openalex.org/W4386083031","https://openalex.org/W4396926906","https://openalex.org/W6638523607","https://openalex.org/W6670227514","https://openalex.org/W6677103964","https://openalex.org/W6677580257","https://openalex.org/W6726275242","https://openalex.org/W6729956949","https://openalex.org/W6745519486","https://openalex.org/W6751979845","https://openalex.org/W6752515464","https://openalex.org/W6757817989","https://openalex.org/W6759263581","https://openalex.org/W6762945437","https://openalex.org/W6766275931","https://openalex.org/W6774375107","https://openalex.org/W6779460946","https://openalex.org/W6784333009","https://openalex.org/W6787352875","https://openalex.org/W6788034315","https://openalex.org/W6788713141","https://openalex.org/W6796652220","https://openalex.org/W6798029099","https://openalex.org/W6800633732","https://openalex.org/W6802648153","https://openalex.org/W6810362000","https://openalex.org/W6839423864","https://openalex.org/W6849849255","https://openalex.org/W6852962002","https://openalex.org/W6853496605"],"related_works":["https://openalex.org/W4285277090","https://openalex.org/W4327738859","https://openalex.org/W2348722996","https://openalex.org/W2334570605","https://openalex.org/W3181683615","https://openalex.org/W4286826125","https://openalex.org/W1633485514","https://openalex.org/W1604739066","https://openalex.org/W2115878407","https://openalex.org/W1980454230"],"abstract_inverted_index":{"Transformer":[0],"models":[1,11],"have":[2],"gained":[3],"popularity":[4],"for":[5],"their":[6],"exceptional":[7],"performance.":[8],"However,":[9],"these":[10],"still":[12],"face":[13],"the":[14,22,112,150,154],"challenge":[15],"of":[16,25,60,116],"high":[17],"inference":[18,125],"latency.":[19],"To":[20],"improve":[21],"computational":[23],"efficiency":[24,115,126],"such":[26],"models,":[27,95],"we":[28],"propose":[29],"a":[30,58,73],"novel":[31],"differentiable":[32],"pruning":[33,75],"method":[34],"called":[35],"DARIO":[36,71,88,118,120,137],"(<bold":[37],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[38,40,45,47,52],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">D</b>ifferenti<bold":[39],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">A</b>ble":[41],"vision":[42],"transformer":[43],"p<bold":[44],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">R</b>un<bold":[46],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">I</b>ng":[48],"with":[49],"low-cost":[50,68],"pr<bold":[51],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">O</b>xies).":[53],"Our":[54],"approach":[55],"involves":[56],"optimizing":[57],"set":[59],"gating":[61],"parameters":[62],"using":[63],"differentiable,":[64],"data-agnostic,":[65],"scale-invariant,":[66],"and":[67,100,114,153],"performance":[69],"proxies.":[70],"is":[72],"data-agnostic":[74],"method,":[76],"it":[77],"does":[78],"not":[79,121],"need":[80],"any":[81],"classification":[82,155],"heads":[83],"during":[84],"pruning.":[85],"We":[86],"evaluated":[87],"on":[89,127,145],"two":[90],"popular":[91],"state-of-the-art":[92],"pre-trained":[93],"ViT":[94],"including":[96],"both":[97],"large":[98],"(MAE-ViT)":[99],"small":[101],"(MobileViT)":[102],"sizes.":[103],"Extensive":[104],"experiments":[105],"conducted":[106],"across":[107],"40":[108],"diverse":[109],"datasets":[110],"demonstrated":[111],"effectiveness":[113],"our":[117],"method.":[119],"only":[122,148],"significantly":[123],"improves":[124],"modern":[128],"hardware":[129],"but":[130],"also":[131],"excels":[132],"in":[133,143],"preserving":[134],"accuracy.":[135],"Notably,":[136],"has":[138],"even":[139],"achieved":[140],"an":[141],"increase":[142],"accuracy":[144],"MobileViT,":[146],"despite":[147],"fine-tuning":[149],"last":[151],"block":[152],"head.":[156]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-12T08:23:45.883708","created_date":"2025-10-10T00:00:00"}
