{"id":"https://openalex.org/W3176637778","doi":"https://doi.org/10.1162/neco_a_01483","title":"Understanding Dynamics of Nonlinear Representation Learning and Its Application","display_name":"Understanding Dynamics of Nonlinear Representation Learning and Its Application","publication_year":2022,"publication_date":"2022-03-02","ids":{"openalex":"https://openalex.org/W3176637778","doi":"https://doi.org/10.1162/neco_a_01483","mag":"3176637778","pmid":"https://pubmed.ncbi.nlm.nih.gov/35231929"},"language":"en","primary_location":{"id":"doi:10.1162/neco_a_01483","is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01483","pdf_url":"https://direct.mit.edu/neco/article-pdf/34/4/991/2003085/neco_a_01483.pdf","source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computation","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://direct.mit.edu/neco/article-pdf/34/4/991/2003085/neco_a_01483.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003184366","display_name":"Kenji Kawaguchi","orcid":"https://orcid.org/0000-0002-5361-9793"},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kenji Kawaguchi","raw_affiliation_strings":["Harvard University, Cambridge, MA 02138, U.S.A. kkawaguchi@fas.harvard.edu"],"affiliations":[{"raw_affiliation_string":"Harvard University, Cambridge, MA 02138, U.S.A. kkawaguchi@fas.harvard.edu","institution_ids":["https://openalex.org/I136199984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115593378","display_name":"Linjun Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Linjun Zhang","raw_affiliation_strings":["Rutgers University, New Brunswick, NJ 08901 linjun.zhang@rutgers.edu"],"affiliations":[{"raw_affiliation_string":"Rutgers University, New Brunswick, NJ 08901 linjun.zhang@rutgers.edu","institution_ids":["https://openalex.org/I102322142"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006488129","display_name":"Zhun Deng","orcid":"https://orcid.org/0009-0002-3785-8513"},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhun Deng","raw_affiliation_strings":["Harvard University Cambridge, MA 02138, U.S.A. zhundeng@g.harvard.edu"],"affiliations":[{"raw_affiliation_string":"Harvard University Cambridge, MA 02138, U.S.A. zhundeng@g.harvard.edu","institution_ids":["https://openalex.org/I2801851002"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003184366","https://openalex.org/A5006488129","https://openalex.org/A5115593378"],"corresponding_institution_ids":["https://openalex.org/I102322142","https://openalex.org/I136199984","https://openalex.org/I2801851002"],"apc_list":null,"apc_paid":null,"fwci":0.276,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.59876996,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"34","issue":"4","first_page":"991","last_page":"1018"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6796313524246216},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6496461033821106},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5893508195877075},{"id":"https://openalex.org/keywords/raw-data","display_name":"Raw data","score":0.5736581087112427},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5224648714065552},{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.5167005062103271},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5057170391082764},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45617035031318665},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.41395482420921326}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6796313524246216},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6496461033821106},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5893508195877075},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.5736581087112427},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5224648714065552},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.5167005062103271},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5057170391082764},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45617035031318665},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.41395482420921326},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1162/neco_a_01483","is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01483","pdf_url":"https://direct.mit.edu/neco/article-pdf/34/4/991/2003085/neco_a_01483.pdf","source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computation","raw_type":"journal-article"},{"id":"pmid:35231929","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35231929","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural computation","raw_type":null},{"id":"pmh:oai:arXiv.org:2106.14836","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2106.14836","pdf_url":"https://arxiv.org/pdf/2106.14836","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1162/neco_a_01483","is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01483","pdf_url":"https://direct.mit.edu/neco/article-pdf/34/4/991/2003085/neco_a_01483.pdf","source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computation","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3176637778.pdf","grobid_xml":"https://content.openalex.org/works/W3176637778.grobid-xml"},"referenced_works_count":59,"referenced_works":["https://openalex.org/W22861983","https://openalex.org/W54257720","https://openalex.org/W71795751","https://openalex.org/W1596986901","https://openalex.org/W1677182931","https://openalex.org/W1738124305","https://openalex.org/W1993882792","https://openalex.org/W2002454301","https://openalex.org/W2076094076","https://openalex.org/W2101234009","https://openalex.org/W2103305545","https://openalex.org/W2103359087","https://openalex.org/W2110798204","https://openalex.org/W2112796928","https://openalex.org/W2125930537","https://openalex.org/W2136922672","https://openalex.org/W2141125852","https://openalex.org/W2147768505","https://openalex.org/W2160815625","https://openalex.org/W2163605009","https://openalex.org/W2163922914","https://openalex.org/W2166093887","https://openalex.org/W2168013545","https://openalex.org/W2187386544","https://openalex.org/W2215006509","https://openalex.org/W2250379827","https://openalex.org/W2302255633","https://openalex.org/W2335728318","https://openalex.org/W2394932179","https://openalex.org/W2434635047","https://openalex.org/W2475287302","https://openalex.org/W2559655401","https://openalex.org/W2596585349","https://openalex.org/W2604272474","https://openalex.org/W2604721644","https://openalex.org/W2782476368","https://openalex.org/W2798909945","https://openalex.org/W2902986194","https://openalex.org/W2911153392","https://openalex.org/W2919115771","https://openalex.org/W2963446085","https://openalex.org/W2963504252","https://openalex.org/W2964072429","https://openalex.org/W2970971581","https://openalex.org/W2990138404","https://openalex.org/W2995553068","https://openalex.org/W3103357424","https://openalex.org/W3118608800","https://openalex.org/W3125148525","https://openalex.org/W3156245182","https://openalex.org/W3162402566","https://openalex.org/W3170945223","https://openalex.org/W3175491950","https://openalex.org/W6669713995","https://openalex.org/W6675354045","https://openalex.org/W6701575323","https://openalex.org/W6750968397","https://openalex.org/W6772121514","https://openalex.org/W7047167133"],"related_works":["https://openalex.org/W2055243143","https://openalex.org/W2062195135","https://openalex.org/W3012838233","https://openalex.org/W4252510819","https://openalex.org/W4321636575","https://openalex.org/W2330446075","https://openalex.org/W1986418932","https://openalex.org/W2357796999","https://openalex.org/W2045526782","https://openalex.org/W2741131631"],"abstract_inverted_index":{"Representations":[0],"of":[1,25,33,96,106,200],"the":[2,23,94,115,120,126,130,141,164,168,183,214,239],"world":[3],"environment":[4],"play":[5],"a":[6,54,84,104,107,111,178,191,195,208,235],"crucial":[7],"role":[8],"in":[9,22,167],"artificial":[10],"intelligence.":[11],"It":[12],"is":[13,135,245],"often":[14],"inefficient":[15],"to":[16,39,137,248],"conduct":[17],"reasoning":[18],"and":[19,110,119,144,154,160,232,268,282],"inference":[20],"directly":[21],"space":[24],"raw":[26,45,51],"sensory":[27,46,52],"representations,":[28],"such":[29,97],"as":[30,190],"pixel":[31],"values":[32],"images.":[34],"Representation":[35],"learning":[36],"allows":[37],"us":[38],"automatically":[40,223],"discover":[41],"suitable":[42],"representations":[43,60],"from":[44],"data.":[47],"For":[48],"example,":[49,182],"given":[50,226],"data,":[53],"deep":[55,260],"neural":[56,262],"network":[57,157],"learns":[58],"nonlinear":[59,99],"at":[61,73],"its":[62,74,242],"hidden":[63],"layers,":[64],"which":[65,212],"are":[66],"subsequently":[67],"used":[68,189],"for":[69,140,146,176,181,193,259],"classification":[70],"(or":[71],"regression)":[72],"output":[75],"layer.":[76],"This":[77],"happens":[78],"implicitly":[79],"during":[80],"training":[81,165,210,227,237],"through":[82],"minimizing":[83],"supervised":[85],"or":[86],"unsupervised":[87],"loss.":[88],"In":[89],"this":[90],"letter,":[91],"we":[92,205],"study":[93],"dynamics":[95],"implicit":[98],"representation":[100],"learning.":[101],"We":[102],"identify":[103],"pair":[105],"new":[108,209],"assumption":[109,118,186],"novel":[112],"condition,":[113],"called":[114],"on-model":[116,127,184],"structure":[117,128,185,198],"data":[121,131,215,231,274],"architecture":[122,132,216],"alignment":[123,133,217],"condition.":[124],"Under":[125],"assumption,":[129],"condition":[134,218],"shown":[136,247],"be":[138,188],"sufficient":[139],"global":[142,147,256],"convergence":[143,257],"necessary":[145],"optimality.":[148],"Moreover,":[149],"our":[150],"theory":[151],"explains":[152],"how":[153],"when":[155],"increasing":[156],"size":[158],"does":[159,161],"not":[162],"improve":[163],"behaviors":[166],"practical":[169,174],"regime.":[170],"Our":[171],"results":[172],"provide":[173],"guidance":[175],"designing":[177],"model":[179,197],"structure;":[180],"can":[187],"justification":[192],"using":[194],"particular":[196],"instead":[199],"others.":[201],"As":[202],"an":[203],"application,":[204],"then":[206],"derive":[207],"framework,":[211],"satisfies":[213],"without":[219],"assuming":[220],"it":[221],"by":[222],"modifying":[224],"any":[225],"algorithm":[228],"dependent":[229],"on":[230],"architecture.":[233],"Given":[234],"standard":[236,272],"algorithm,":[238],"framework":[240],"running":[241],"modified":[243],"version":[244],"empirically":[246],"maintain":[249],"competitive":[250],"(practical)":[251],"test":[252],"performances":[253],"while":[254],"providing":[255],"guarantees":[258],"residual":[261],"networks":[263],"with":[264,271],"convolutions,":[265],"skip":[266],"connections,":[267],"batch":[269],"normalization":[270],"benchmark":[273],"sets,":[275],"including":[276],"MNIST,":[277],"CIFAR-10,":[278],"CIFAR-100,":[279],"Semeion,":[280],"KMNIST,":[281],"SVHN.":[283]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
