{"id":"https://openalex.org/W3013844214","doi":"https://doi.org/10.1109/ieeeconf44664.2019.9048845","title":"Generalization, Adaptation and Low-Rank Representation in Neural Networks","display_name":"Generalization, Adaptation and Low-Rank Representation in Neural Networks","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W3013844214","doi":"https://doi.org/10.1109/ieeeconf44664.2019.9048845","mag":"3013844214"},"language":"en","primary_location":{"id":"doi:10.1109/ieeeconf44664.2019.9048845","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ieeeconf44664.2019.9048845","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 53rd Asilomar Conference on Signals, Systems, and Computers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050547472","display_name":"Samet Oymak","orcid":"https://orcid.org/0000-0001-5203-0752"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Samet Oymak","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of California, Riverside"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of California, Riverside","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088599790","display_name":"Zalan Fabian","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zalan Fabian","raw_affiliation_strings":["Ming Hsieh Department of Electrical Engineering, University of Southern California"],"affiliations":[{"raw_affiliation_string":"Ming Hsieh Department of Electrical Engineering, University of Southern California","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074422516","display_name":"Mingchen Li","orcid":"https://orcid.org/0000-0002-0736-1541"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingchen Li","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California, Riverside"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California, Riverside","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046962187","display_name":"Mahdi Soltanolkotabi","orcid":"https://orcid.org/0000-0003-2101-6418"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mahdi Soltanolkotabi","raw_affiliation_strings":["Ming Hsieh Department of Electrical Engineering, University of Southern California"],"affiliations":[{"raw_affiliation_string":"Ming Hsieh Department of Electrical Engineering, University of Southern California","institution_ids":["https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5050547472"],"corresponding_institution_ids":["https://openalex.org/I103635307"],"apc_list":null,"apc_paid":null,"fwci":0.2878,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.48496241,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"581","last_page":"585"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/jacobian-matrix-and-determinant","display_name":"Jacobian matrix and determinant","score":0.9494025707244873},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.8983135223388672},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.674618661403656},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6560350656509399},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6413151025772095},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.612354040145874},{"id":"https://openalex.org/keywords/principal","display_name":"Principal (computer security)","score":0.6009073853492737},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5619321465492249},{"id":"https://openalex.org/keywords/early-stopping","display_name":"Early stopping","score":0.5003981590270996},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.43089205026626587},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4272882044315338},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4229786992073059},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.37875255942344666},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3658927083015442},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3600252866744995},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2357657253742218},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.10733217000961304}],"concepts":[{"id":"https://openalex.org/C200331156","wikidata":"https://www.wikidata.org/wiki/Q506041","display_name":"Jacobian matrix and determinant","level":2,"score":0.9494025707244873},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.8983135223388672},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.674618661403656},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6560350656509399},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6413151025772095},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.612354040145874},{"id":"https://openalex.org/C144559511","wikidata":"https://www.wikidata.org/wiki/Q2986279","display_name":"Principal (computer security)","level":2,"score":0.6009073853492737},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5619321465492249},{"id":"https://openalex.org/C5465570","wikidata":"https://www.wikidata.org/wiki/Q5326898","display_name":"Early stopping","level":3,"score":0.5003981590270996},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.43089205026626587},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4272882044315338},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4229786992073059},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37875255942344666},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3658927083015442},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3600252866744995},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2357657253742218},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.10733217000961304},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ieeeconf44664.2019.9048845","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ieeeconf44664.2019.9048845","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 53rd Asilomar Conference on Signals, Systems, and Computers","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W2626325961","https://openalex.org/W2804589149","https://openalex.org/W2806970110","https://openalex.org/W2809090039","https://openalex.org/W2886067286","https://openalex.org/W2894604724","https://openalex.org/W2895492274","https://openalex.org/W2897097528","https://openalex.org/W2900103278","https://openalex.org/W2900959181","https://openalex.org/W2904838594","https://openalex.org/W2905800572","https://openalex.org/W2911867426","https://openalex.org/W2921467542","https://openalex.org/W2927724204","https://openalex.org/W2938647293","https://openalex.org/W2941057241","https://openalex.org/W2949582403","https://openalex.org/W2949804919","https://openalex.org/W2949960976","https://openalex.org/W2962916883","https://openalex.org/W2963239103","https://openalex.org/W2963622172","https://openalex.org/W2963837241","https://openalex.org/W2970330753","https://openalex.org/W2995354826","https://openalex.org/W3021189130","https://openalex.org/W3031885728","https://openalex.org/W3093329015","https://openalex.org/W3137695714","https://openalex.org/W3152114226","https://openalex.org/W4288593476","https://openalex.org/W4289293816","https://openalex.org/W4289436733","https://openalex.org/W4297813530","https://openalex.org/W4299971819","https://openalex.org/W6729595453","https://openalex.org/W6739706309","https://openalex.org/W6751100130","https://openalex.org/W6752009368","https://openalex.org/W6752125765","https://openalex.org/W6752495264","https://openalex.org/W6753918066","https://openalex.org/W6755150206","https://openalex.org/W6755308174","https://openalex.org/W6755511848","https://openalex.org/W6756137178","https://openalex.org/W6756867819","https://openalex.org/W6757685903","https://openalex.org/W6758902322","https://openalex.org/W6759176382","https://openalex.org/W6760242218","https://openalex.org/W6761561157","https://openalex.org/W6762156623","https://openalex.org/W6763485134","https://openalex.org/W6763845970","https://openalex.org/W6765762003","https://openalex.org/W6768793533"],"related_works":["https://openalex.org/W2007405763","https://openalex.org/W3136087161","https://openalex.org/W1486373823","https://openalex.org/W2119578520","https://openalex.org/W2053762185","https://openalex.org/W2913611334","https://openalex.org/W1984283682","https://openalex.org/W3216339657","https://openalex.org/W3013844214","https://openalex.org/W3161646234"],"abstract_inverted_index":{"We":[0,97,115],"develop":[1],"a":[2,66,142],"data-dependent":[3],"optimization":[4],"and":[5,29,35,38,42,61,84,128,147,167,173],"generalization":[6,30,90],"theory":[7],"for":[8],"neural":[9,101,136],"networks":[10,102,122,137],"which":[11],"leverages":[12],"the":[13,16,21,50,54,78,92,112,132,154,160],"lowrankness":[14],"of":[15,53,94,111,134,153],"Jacobian":[17,55,113,133,169],"matrix":[18,56],"associated":[19],"with":[20,68,89,141],"network.":[22],"Our":[23],"results":[24],"help":[25,88],"demystify":[26],"why":[27],"training":[28,70,81],"is":[31,59,82,165],"easier":[32],"on":[33,40,120,159],"clean":[34],"structured":[36],"datasets":[37],"harder":[39],"noisy":[41],"unstructured":[43],"datasets.":[44],"Specifically,":[45],"we":[46],"show":[47],"that":[48,72,123],"over":[49,107,171],"principal":[51,161],"eigendirections":[52,162],"space":[57],"learning":[58,164],"fast":[60],"one":[62],"can":[63,73,87,103],"quickly":[64],"train":[65],"model":[67],"zero":[69],"loss":[71],"also":[74,98],"generalize":[75],"well.":[76],"Over":[77],"smaller":[79],"eigendirections,":[80],"slower":[83],"early":[85],"stopping":[86],"at":[91],"expense":[93],"some":[95],"bias.":[96],"discuss":[99],"how":[100],"learn":[104,174],"better":[105,175],"representations":[106],"time":[108,172],"in":[109],"terms":[110],"mapping.":[114],"conduct":[116],"various":[117],"numerical":[118],"experiments":[119],"deep":[121],"corroborate":[124],"our":[125],"theoretical":[126],"findings":[127],"demonstrate":[129],"that:":[130],"(i)":[131],"typical":[135],"exhibit":[138],"low-rank":[139],"structure":[140],"few":[143],"large":[144],"singular":[145],"values":[146],"many":[148],"small":[149],"ones,":[150],"(ii)":[151],"most":[152],"useful":[155],"label":[156],"information":[157],"lies":[158],"where":[163],"fast,":[166],"(iii)":[168],"adapts":[170],"representations.":[176]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
