{"id":"https://openalex.org/W4402435320","doi":"https://doi.org/10.1109/access.2024.3457863","title":"A Generalist Reinforcement Learning Agent for Compressing Multiple Convolutional Networks Using Singular Value Decomposition","display_name":"A Generalist Reinforcement Learning Agent for Compressing Multiple Convolutional Networks Using Singular Value Decomposition","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402435320","doi":"https://doi.org/10.1109/access.2024.3457863"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3457863","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3457863","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dx.doi.org/10.1109/access.2024.3457863","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095044475","display_name":"Gabriel Gonzalez-Sahagun","orcid":"https://orcid.org/0009-0009-7931-4654"},"institutions":[{"id":"https://openalex.org/I98461037","display_name":"Tecnol\u00f3gico de Monterrey","ror":"https://ror.org/03ayjn504","country_code":"MX","type":"education","lineage":["https://openalex.org/I98461037"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Gabriel Gonzalez-Sahagun","raw_affiliation_strings":["School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]},{"raw_affiliation_string":"Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028807044","display_name":"Santiago Enrique Conant-Pablos","orcid":"https://orcid.org/0000-0001-6270-3164"},"institutions":[{"id":"https://openalex.org/I98461037","display_name":"Tecnol\u00f3gico de Monterrey","ror":"https://ror.org/03ayjn504","country_code":"MX","type":"education","lineage":["https://openalex.org/I98461037"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Santiago Enrique Conant-Pablos","raw_affiliation_strings":["School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]},{"raw_affiliation_string":"Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027131130","display_name":"Jos\u00e9 Carlos Ort\u00edz-Bayliss","orcid":"https://orcid.org/0000-0003-3408-2166"},"institutions":[{"id":"https://openalex.org/I98461037","display_name":"Tecnol\u00f3gico de Monterrey","ror":"https://ror.org/03ayjn504","country_code":"MX","type":"education","lineage":["https://openalex.org/I98461037"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Carlos Ortiz-Bayliss","raw_affiliation_strings":["School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]},{"raw_affiliation_string":"Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086193689","display_name":"Jorge M. Cruz\u2010Duarte","orcid":"https://orcid.org/0000-0003-4494-7864"},"institutions":[{"id":"https://openalex.org/I98461037","display_name":"Tecnol\u00f3gico de Monterrey","ror":"https://ror.org/03ayjn504","country_code":"MX","type":"education","lineage":["https://openalex.org/I98461037"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Jorge M. Cruz-Duarte","raw_affiliation_strings":["School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Sciences, Tecnologico de Monterrey, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]},{"raw_affiliation_string":"Tecnologico de Monterrey, School of Engineering and Sciences, Monterrey, Nuevo Leon, Mexico","institution_ids":["https://openalex.org/I98461037"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5095044475"],"corresponding_institution_ids":["https://openalex.org/I98461037"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.34,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.65960274,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"12","issue":null,"first_page":"136131","last_page":"136147"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.840399980545044,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.840399980545044,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8445861339569092},{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.6675094962120056},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6530553698539734},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.5879971981048584},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.48424383997917175},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.412127822637558},{"id":"https://openalex.org/keywords/composite-material","display_name":"Composite material","score":0.10939809679985046},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.10726886987686157},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06066820025444031}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8445861339569092},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.6675094962120056},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6530553698539734},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.5879971981048584},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.48424383997917175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.412127822637558},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.10939809679985046},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.10726886987686157},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06066820025444031},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3457863","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3457863","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:dfcac66038704835858a82b8a2f6170e","is_oa":true,"landing_page_url":"https://doaj.org/article/dfcac66038704835858a82b8a2f6170e","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 136131-136147 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3457863","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3457863","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"Deep":[0],"learning":[1,82],"models":[2,16,88,95],"have":[3,39],"gained":[4],"popularity":[5],"in":[6,23,142],"the":[7,44,52,65,72,103,108,135,147,154,163,167,181,188,209],"last":[8],"decade":[9],"for":[10,47,78,111,161,220,223],"computer":[11],"vision":[12],"tasks.":[13],"Although":[14],"these":[15,48,68],"are":[17],"widely":[18],"used,":[19],"they":[20],"process":[21,63],"data":[22],"cloud":[24],"services":[25],"due":[26],"to":[27,42,55,89,92,113,140,177,198,214],"requiring":[28],"large":[29],"amounts":[30],"of":[31,67,126,137,146,149,171,200,218],"memory":[32,45],"unavailable":[33],"on":[34,196],"consumer":[35],"devices.":[36],"Multiple":[37],"techniques":[38,69],"been":[40],"proposed":[41],"reduce":[43],"needed":[46],"models.":[49],"Nonetheless,":[50],"finding":[51],"best":[53],"method":[54],"compress":[56,93,114,178],"each":[57,150,172],"model":[58,83,117,132,194],"can":[59,118],"be":[60,119],"a":[61,76,80,115,124,131,143,193,221],"time-consuming":[62],"as":[64],"parameters":[66],"significantly":[70],"affect":[71],"results.":[73],"We":[74,152],"propose":[75],"methodology":[77],"training":[79],"reinforcement":[81],"that":[84],"exploits":[85],"similarities":[86],"between":[87],"select":[90],"how":[91,112],"other":[94],"it":[96],"has":[97],"not":[98],"seen":[99],"before.":[100],"By":[101],"reusing":[102],"generalist":[104,210],"agent":[105,122,175,211],"and":[106,129,165],"exploiting":[107],"similarities,":[109],"searching":[110,219],"new":[116],"avoided.":[120],"The":[121],"receives":[123],"set":[125],"feature":[127,155],"maps":[128,156],"compresses":[130],"by":[133,157],"choosing":[134],"percentage":[136],"singular":[138],"values":[139],"use":[141],"low-rank":[144],"factorization":[145],"weights":[148],"layer.":[151],"chose":[153],"generating":[158],"an":[159],"embedding":[160],"all":[162],"images":[164],"selecting":[166],"most":[168],"representative":[169],"image":[170],"class.":[173],"Our":[174],"trained":[176,183,195],"two":[179],"models,":[180],"first":[182],"using":[184,190],"fashion":[185],"MNIST,":[186],"whereas":[187],"second,":[189],"Kuzushiji-MNIST,":[191],"reduced":[192],"MNIST":[197],"15%":[199],"its":[201],"original":[202],"size":[203],"with":[204],"minimal":[205],"accuracy":[206],"loss.":[207],"Reusing":[208],"permitted":[212],"us":[213],"skip":[215],"4.6":[216],"days":[217],"solution":[222],"MNIST.":[224]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-09T06:08:40.794217","created_date":"2025-10-10T00:00:00"}
