{"id":"https://openalex.org/W4408352882","doi":"https://doi.org/10.1109/icassp49660.2025.10889827","title":"Low Rank and Sparse Fourier Structure in Recurrent Networks Trained on Modular Addition","display_name":"Low Rank and Sparse Fourier Structure in Recurrent Networks Trained on Modular Addition","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408352882","doi":"https://doi.org/10.1109/icassp49660.2025.10889827"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10889827","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889827","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079543741","display_name":"Akshay Rangamani","orcid":null},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Akshay Rangamani","raw_affiliation_strings":["New Jersey Institute of Technology,Dept. of Data Science,Newark,NJ,USA"],"affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology,Dept. of Data Science,Newark,NJ,USA","institution_ids":["https://openalex.org/I118118575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5079543741"],"corresponding_institution_ids":["https://openalex.org/I118118575"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05838999,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.756600022315979,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.756600022315979,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10083","display_name":"Graphene research and applications","score":0.7038999795913696,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10666","display_name":"Photonic Crystals and Applications","score":0.6933000087738037,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.7119895219802856},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6466131806373596},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5760858058929443},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.49849891662597656},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41745585203170776},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34729278087615967},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22593343257904053},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11136376857757568},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.10463204979896545}],"concepts":[{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.7119895219802856},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6466131806373596},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5760858058929443},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.49849891662597656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41745585203170776},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34729278087615967},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22593343257904053},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11136376857757568},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.10463204979896545},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10889827","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10889827","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W4231799185","https://openalex.org/W6739901393","https://openalex.org/W6778883912","https://openalex.org/W6803444062","https://openalex.org/W6810970779","https://openalex.org/W6849213839","https://openalex.org/W6849345261","https://openalex.org/W6854378537","https://openalex.org/W6856750695","https://openalex.org/W6858431395","https://openalex.org/W6859298233","https://openalex.org/W6859809320","https://openalex.org/W6869087226","https://openalex.org/W6870774110","https://openalex.org/W6872598165"],"related_works":["https://openalex.org/W2378076731","https://openalex.org/W4286888643","https://openalex.org/W3210795196","https://openalex.org/W2088988140","https://openalex.org/W3171015545","https://openalex.org/W2103019253","https://openalex.org/W2951529875","https://openalex.org/W2614680695","https://openalex.org/W2033914206","https://openalex.org/W2042327336"],"abstract_inverted_index":{"Modular":[0],"addition":[1,36,51],"tasks":[2,52],"serve":[3],"as":[4,103],"a":[5,55,78],"useful":[6],"test":[7],"bed":[8],"for":[9],"observing":[10],"empirical":[11],"phenomena":[12],"in":[13,64,77,81],"deep":[14],"learning,":[15],"including":[16],"the":[17,65,82,90,99,109],"phenomenon":[18],"of":[19],"grokking.":[20],"Prior":[21],"work":[22],"has":[23],"shown":[24],"that":[25,43,89],"one-layer":[26],"transformer":[27],"architectures":[28],"learn":[29],"Fourier":[30,56,74,83],"Multiplication":[31,57],"circuits":[32],"to":[33,72,94],"solve":[34],"modular":[35,50],"tasks.":[37],"In":[38],"this":[39],"paper,":[40],"we":[41],"show":[42,87],"Recurrent":[44],"Neural":[45],"Networks":[46],"(RNNs)":[47],"trained":[48],"on":[49],"also":[53,86],"use":[54],"strategy.":[58],"We":[59,85],"identify":[60],"low":[61],"rank":[62],"structures":[63],"model":[66,70],"weights,":[67],"and":[68],"attribute":[69],"components":[71],"specific":[73],"frequencies,":[75,97],"resulting":[76],"sparse":[79],"representation":[80],"space.":[84],"empirically":[88],"RNN":[91],"is":[92],"robust":[93],"removing":[95],"individual":[96],"while":[98],"performance":[100],"degrades":[101],"drastically":[102],"more":[104],"frequencies":[105],"are":[106],"ablated":[107],"from":[108],"model.":[110]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
