{"id":"https://openalex.org/W4388685768","doi":"https://doi.org/10.48550/arxiv.2311.07568","title":"Feature emergence via margin maximization: case studies in algebraic tasks","display_name":"Feature emergence via margin maximization: case studies in algebraic tasks","publication_year":2023,"publication_date":"2023-11-13","ids":{"openalex":"https://openalex.org/W4388685768","doi":"https://doi.org/10.48550/arxiv.2311.07568"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2311.07568","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.07568","pdf_url":"https://arxiv.org/pdf/2311.07568","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2311.07568","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086429101","display_name":"Depen Morwani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Morwani, Depen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035088357","display_name":"Benjamin Edelman","orcid":"https://orcid.org/0000-0003-0573-2836"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Edelman, Benjamin L.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093264965","display_name":"Costin-Andrei Oncescu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oncescu, Costin-Andrei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088011506","display_name":"Rosie Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Rosie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5108381794","display_name":"Sham M. Kakade","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kakade, Sham","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.98089998960495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.98089998960495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9800000190734863,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12536","display_name":"Topological and Geometric Data Analysis","score":0.9769999980926514,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stylized-fact","display_name":"Stylized fact","score":0.7416971921920776},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6951190233230591},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.684695303440094},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.6725090146064758},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5870720148086548},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5730326771736145},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5291643142700195},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5169517397880554},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4757668375968933},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4206911623477936},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.1696775257587433},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16879647970199585}],"concepts":[{"id":"https://openalex.org/C38935604","wikidata":"https://www.wikidata.org/wiki/Q4330363","display_name":"Stylized fact","level":2,"score":0.7416971921920776},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6951190233230591},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.684695303440094},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.6725090146064758},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5870720148086548},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5730326771736145},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5291643142700195},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5169517397880554},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4757668375968933},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4206911623477936},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.1696775257587433},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16879647970199585},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2311.07568","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.07568","pdf_url":"https://arxiv.org/pdf/2311.07568","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2311.07568","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2311.07568","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2311.07568","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.07568","pdf_url":"https://arxiv.org/pdf/2311.07568","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1264789558","display_name":null,"funder_award_id":"W911NF2010021","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G3521671702","display_name":null,"funder_award_id":"2134157","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4720003262","display_name":null,"funder_award_id":"N00014-22","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G5224039946","display_name":null,"funder_award_id":"DE-SC0022199","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G5877837315","display_name":null,"funder_award_id":"DE-SC0022199","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2529311304","https://openalex.org/W4248275646","https://openalex.org/W2992609826","https://openalex.org/W3124809058","https://openalex.org/W2552900035","https://openalex.org/W2162875951","https://openalex.org/W2062875858","https://openalex.org/W4380047323","https://openalex.org/W2138330538","https://openalex.org/W1886423216"],"abstract_inverted_index":{"Understanding":[0],"the":[1,13,56,75,92,104,108,114,141],"internal":[2],"representations":[3,131],"learned":[4,77,106],"by":[5,78,107],"neural":[6,31,80,167],"networks":[7,32,46,81,116,168],"is":[8],"a":[9,40,162],"cornerstone":[10],"challenge":[11],"in":[12,25,135],"science":[14],"of":[15,60,94,144,165],"machine":[16],"learning.":[17],"While":[18],"there":[19],"have":[20],"been":[21],"significant":[22],"recent":[23],"strides":[24],"some":[26],"cases":[27],"towards":[28],"understanding":[29,164],"how":[30,91],"implement":[33],"specific":[34,170],"target":[35],"functions,":[36],"this":[37],"paper":[38],"explores":[39],"complementary":[41],"question":[42],"--":[43],"why":[44,166],"do":[45],"arrive":[47],"at":[48],"particular":[49],"computational":[50,171],"strategies?":[51],"Our":[52,69],"inquiry":[53],"focuses":[54],"on":[55],"algebraic":[57,84],"learning":[58],"tasks":[59],"modular":[61,122],"addition,":[62],"sparse":[63],"parities,":[64],"and":[65,124,148],"finite":[66],"group":[67],"operations.":[68],"primary":[70],"theoretical":[71],"findings":[72],"analytically":[73],"characterize":[74],"features":[76,105,119,126],"stylized":[79],"for":[82],"these":[83],"tasks.":[85],"Notably,":[86],"our":[87,156],"main":[88],"technique":[89],"demonstrates":[90],"principle":[93],"margin":[95],"maximization":[96],"alone":[97],"can":[98,158],"be":[99],"used":[100],"to":[101,120,128,132,160],"fully":[102],"specify":[103],"network.":[109],"Specifically,":[110],"we":[111,154],"prove":[112],"that":[113],"trained":[115],"utilize":[117],"Fourier":[118],"perform":[121,133],"addition":[123],"employ":[125],"corresponding":[127],"irreducible":[129],"group-theoretic":[130],"compositions":[134],"general":[136],"groups,":[137],"aligning":[138],"closely":[139],"with":[140],"empirical":[142],"observations":[143],"Nanda":[145],"et":[146,150],"al.":[147,151],"Chughtai":[149],"More":[152],"generally,":[153],"hope":[155],"techniques":[157],"help":[159],"foster":[161],"deeper":[163],"adopt":[169],"strategies.":[172]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2023-11-15T00:00:00"}
