{"id":"https://openalex.org/W7140304791","doi":"https://doi.org/10.48550/arxiv.2603.22539","title":"Generalized multi-object classification and tracking with sparse feature resonator networks","display_name":"Generalized multi-object classification and tracking with sparse feature resonator networks","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140304791","doi":"https://doi.org/10.48550/arxiv.2603.22539"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22539","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22539","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22539","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062558710","display_name":"Lazar Supic","orcid":"https://orcid.org/0000-0002-3954-9688"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Supic, Lazar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130588909","display_name":"Alec Mullen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mullen, Alec","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130616145","display_name":"E. Paxon Frady","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Frady, E. Paxon","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5062558710"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.33079999685287476,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.33079999685287476,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.18299999833106995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10245","display_name":"Metamaterials and Metasurfaces Applications","score":0.0754999965429306,"subfield":{"id":"https://openalex.org/subfields/2504","display_name":"Electronic, Optical and Magnetic Materials"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mnist-database","display_name":"MNIST database","score":0.5232999920845032},{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.5077000260353088},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48739999532699585},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4666000008583069},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.45399999618530273},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.4271000027656555},{"id":"https://openalex.org/keywords/equivariant-map","display_name":"Equivariant map","score":0.412200003862381},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3944000005722046}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6067000031471252},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5928000211715698},{"id":"https://openalex.org/C190502265","wikidata":"https://www.wikidata.org/wiki/Q17069496","display_name":"MNIST database","level":3,"score":0.5232999920845032},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.5077000260353088},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48739999532699585},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4666000008583069},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.45399999618530273},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4271000027656555},{"id":"https://openalex.org/C171036898","wikidata":"https://www.wikidata.org/wiki/Q256355","display_name":"Equivariant map","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3944000005722046},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.36649999022483826},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3492000102996826},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3319000005722046},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3176000118255615},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.2542000114917755},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22539","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22539","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22539","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22539","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"visual":[1],"scene":[2],"understanding":[3],"tasks,":[4],"it":[5],"is":[6,51,184],"essential":[7],"to":[8,21,24,38,64,131,144,176,265],"capture":[9],"both":[10,112],"invariant":[11,113],"and":[12,59,79,96,101,110,114,195,232,256],"equivariant":[13,39,115],"structure.":[14],"While":[15],"neural":[16],"networks":[17],"are":[18],"frequently":[19],"trained":[20,185],"achieve":[22],"invariance":[23,50],"transformations":[25,66],"such":[26],"as":[27,127,198],"translation,":[28],"this":[29],"often":[30],"comes":[31],"at":[32,237],"the":[33,43,88,107,141,151,165,196,215,228,241,253,260],"cost":[34],"of":[35,46,90,138,214,222,245,272],"losing":[36],"access":[37],"information":[40,116,163,244],"-":[41],"e.g.,":[42],"precise":[44],"location":[45],"an":[47,74],"object.":[48],"Moreover,":[49],"not":[52,67],"naturally":[53],"guaranteed":[54],"through":[55],"supervised":[56],"learning":[57],"alone,":[58],"many":[60],"architectures":[61],"generalize":[62],"poorly":[63],"input":[65],"encountered":[68],"during":[69],"training.":[70],"Here,":[71],"we":[72,257],"take":[73],"approach":[75],"based":[76],"on":[77,178,187],"analysis-by-synthesis":[78],"factoring":[80],"using":[81],"resonator":[82,104,142,216,261],"networks.":[83],"A":[84],"generative":[85,108],"model":[86],"describes":[87],"construction":[89],"simple":[91,174],"scenes":[92,223],"containing":[93],"MNIST":[94],"digits":[95],"their":[97],"transformations,":[98],"like":[99],"color":[100],"position.":[102],"The":[103,154,181,210],"network":[105,143,197,217,229],"inverts":[106],"model,":[109],"provides":[111,157],"about":[117,164],"particular":[118,247],"objects.":[119],"Sparse":[120],"features":[121],"learned":[122],"from":[123,150,252],"training":[124,193],"data":[125,208],"act":[126],"a":[128,158,173,199,238,246,273],"basis":[129],"set":[130],"provide":[132],"flexibility":[133],"in":[134],"representing":[135],"variable":[136],"shapes":[137,149],"objects,":[139,226],"allowing":[140,172],"handle":[145],"previously":[146],"unseen":[147],"digit":[148],"test":[152],"set.":[153],"modular":[155],"structure":[156],"shape":[159,167],"module":[160],"which":[161],"contains":[162],"object":[166,236,248],"with":[168,204,224,270],"translation":[169,254],"factored":[170],"out,":[171],"classifier":[175],"operate":[177],"centered":[179,188],"digits.":[180],"classification":[182],"layer":[183],"solely":[186],"data,":[189,194],"requiring":[190],"much":[191],"less":[192],"whole":[200],"can":[201,249,262],"identify":[202],"objects":[203,269],"arbitrary":[205],"translations":[206],"without":[207],"augmentation.":[209],"natural":[211],"attention-like":[212],"mechanism":[213],"also":[218],"allows":[219],"for":[220],"analysis":[221],"multiple":[225,267],"where":[227],"dynamics":[230],"selects":[231],"centers":[233],"only":[234],"one":[235],"time.":[239],"Further,":[240],"specific":[242],"position":[243],"be":[250,263],"extracted":[251],"module,":[255],"show":[258],"that":[259],"designed":[264],"track":[266],"moving":[268],"precision":[271],"few":[274],"pixels.":[275]},"counts_by_year":[],"updated_date":"2026-03-26T06:10:45.909354","created_date":"2026-03-26T00:00:00"}
