{"id":"https://openalex.org/W2889084551","doi":"https://doi.org/10.1109/ssp.2018.8450819","title":"Simultaneous Sparsity and Parameter Tying for Deep Learning Using Ordered Weighted \u21131 Regularization","display_name":"Simultaneous Sparsity and Parameter Tying for Deep Learning Using Ordered Weighted \u21131 Regularization","publication_year":2018,"publication_date":"2018-06-01","ids":{"openalex":"https://openalex.org/W2889084551","doi":"https://doi.org/10.1109/ssp.2018.8450819","mag":"2889084551"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssp.2018.8450819","pdf_url":null,"source":null,"license":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091676855","display_name":"Dejiao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dejiao Zhang","raw_affiliation_string":"Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor","raw_affiliation_strings":["Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066883909","display_name":"Julian Katz-Samuels","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Julian Katz-Samuels","raw_affiliation_string":"Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor","raw_affiliation_strings":["Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor"]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026826555","display_name":"M\u00e1rio A. T. Figueiredo","orcid":"https://orcid.org/0000-0002-0970-7745"},"institutions":[{"id":"https://openalex.org/I4210120471","display_name":"Instituto de Telecomunica\u00e7\u00f5es","ror":"https://ror.org/02ht4fk33","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210120471"]},{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Mario A.T. Figueiredo","raw_affiliation_string":"Instituto de Telecomunica\u00e7\u00f5es and Instituto Superior Tecnico, Universidade de Lisboa, Portugal","raw_affiliation_strings":["Instituto de Telecomunica\u00e7\u00f5es and Instituto Superior Tecnico, Universidade de Lisboa, Portugal"]},{"author_position":"last","author":{"id":"https://openalex.org/A5029521003","display_name":"Laura Balzano","orcid":"https://orcid.org/0000-0003-2914-123X"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Laura Balzano","raw_affiliation_string":"Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor","raw_affiliation_strings":["Department of.Electrical Engineering and Computer Science, University of Michigan, Ann Arbor"]}],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":2,"cited_by_percentile_year":{"min":75,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10500","display_name":"Theory and Applications of Compressed Sensing","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10500","display_name":"Theory and Applications of Compressed Sensing","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Theory and Applications of Extreme Learning Machines","score":0.9985,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Advances in Transfer Learning and Domain Adaptation","score":0.9947,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"keyword":"parameter tying","score":0.4562},{"keyword":"deep learning","score":0.4533},{"keyword":"ordered weighted","score":0.2756}],"concepts":[{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.71760017},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6820584},{"id":"https://openalex.org/C2780938662","wikidata":"https://www.wikidata.org/wiki/Q973710","display_name":"Tying","level":2,"score":0.61700636},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5628613},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.55885583},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.542218},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.5110925},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4871971},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48349243},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4387887},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.43225437},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.42648673},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40114015},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35148668},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26222572},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13767457},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssp.2018.8450819","pdf_url":null,"source":null,"license":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"referenced_works_count":9,"referenced_works":["https://openalex.org/W1916786071","https://openalex.org/W1949314668","https://openalex.org/W2012653948","https://openalex.org/W2109449402","https://openalex.org/W2112796928","https://openalex.org/W2122825543","https://openalex.org/W2145607950","https://openalex.org/W2963696951","https://openalex.org/W4244393449"],"related_works":["https://openalex.org/W2294590153","https://openalex.org/W4220659530","https://openalex.org/W2998037107","https://openalex.org/W1569871744","https://openalex.org/W2379437105","https://openalex.org/W2016024526","https://openalex.org/W3139928442","https://openalex.org/W1567336638","https://openalex.org/W3124892642","https://openalex.org/W3125367266"],"ngrams_url":"https://api.openalex.org/works/W2889084551/ngrams","abstract_inverted_index":{"A":[0],"deep":[1,106],"neural":[2],"network":[3,116],"(DNN)":[4],"usually":[5],"contains":[6],"millions":[7],"of":[8,88],"parameters,":[9],"making":[10],"both":[11],"storage":[12],"and":[13],"computation":[14],"extremely":[15],"expensive.":[16],"Although":[17],"this":[18,36],"high":[19],"capacity":[20],"allows":[21],"DNNs":[22],"to":[23,32,80,95],"learn":[24],"sophisticated":[25],"mappings,":[26],"it":[27,111],"also":[28,83],"makes":[29],"them":[30],"prone":[31],"over-fitting.":[33],"To":[34],"tackle":[35],"issue,":[37],"we":[38],"adopt":[39],"a":[40,96],"recently":[41],"proposed":[42],"sparsity-inducing":[43,69],"regularizer":[44,103],"called":[45],"OWL":[46,71,102],"(ordered":[47],"weighted":[48],"\u2113":[49],"1":[52],",":[53],"which":[54],"has":[55],"proven":[56],"effective":[57],"in":[58],"sparse":[59],"linear":[60],"regression":[61],"with":[62,117],"strongly":[63],"correlated":[64,86],"covariates.":[65],"Unlike":[66],"the":[67,92,101,115],"conventional":[68],"regularizers,":[70],"simultaneously":[72],"eliminates":[73],"unimportant":[74],"variables":[75,89],"by":[76,90],"setting":[77],"their":[78],"weights":[79,94],"zero,":[81],"while":[82],"explicitly":[84],"identifying":[85],"groups":[87],"tying":[91],"corresponding":[93],"common":[97],"value.":[98],"We":[99],"evaluate":[100],"on":[104,123],"several":[105],"learning":[107],"benchmarks,":[108],"showing":[109],"that":[110],"can":[112],"dramatically":[113],"compress":[114],"slight":[118],"or":[119],"even":[120],"no":[121],"loss":[122],"generalization":[124],"accuracy.":[125]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2889084551","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2024-03-20T02:23:06.357876","created_date":"2018-09-07"}