{"id":"https://openalex.org/W7151501969","doi":"https://doi.org/10.48550/arxiv.2604.03619","title":"Can Natural Image Autoencoders Compactly Tokenize fMRI Volumes for Long-Range Dynamics Modeling?","display_name":"Can Natural Image Autoencoders Compactly Tokenize fMRI Volumes for Long-Range Dynamics Modeling?","publication_year":2026,"publication_date":"2026-04-04","ids":{"openalex":"https://openalex.org/W7151501969","doi":"https://doi.org/10.48550/arxiv.2604.03619"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03619","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03619","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03619","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002655451","display_name":"P. Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Peter Yongho","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069877330","display_name":"Juhyeon Park","orcid":"https://orcid.org/0000-0001-7142-3922"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Juhyeon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133112618","display_name":"Jungwoo Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jungwoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121187211","display_name":"Jubin Choi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Jubin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059205166","display_name":"Jungwoo Seo","orcid":"https://orcid.org/0009-0002-9008-1678"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seo, Jungwoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033979262","display_name":"Jiook Cha","orcid":"https://orcid.org/0000-0002-5314-7992"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cha, Jiook","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5080346989","display_name":"Taesup Moon","orcid":"https://orcid.org/0000-0002-9257-6503"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moon, Taesup","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10241","display_name":"Functional Brain Connectivity Studies","score":0.9605000019073486,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10241","display_name":"Functional Brain Connectivity Studies","score":0.9605000019073486,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.015399999916553497,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10378","display_name":"Advanced MRI Techniques and Applications","score":0.0026000000070780516,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/functional-magnetic-resonance-imaging","display_name":"Functional magnetic resonance imaging","score":0.5490000247955322},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5408999919891357},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5134999752044678},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4837000072002411},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4494999945163727},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4490000009536743},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.43220001459121704},{"id":"https://openalex.org/keywords/human-connectome-project","display_name":"Human Connectome Project","score":0.4122999906539917},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.40380001068115234}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7900000214576721},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5996000170707703},{"id":"https://openalex.org/C2779226451","wikidata":"https://www.wikidata.org/wiki/Q903809","display_name":"Functional magnetic resonance imaging","level":2,"score":0.5490000247955322},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5408999919891357},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5134999752044678},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4837000072002411},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4494999945163727},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4490000009536743},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.43220001459121704},{"id":"https://openalex.org/C97820695","wikidata":"https://www.wikidata.org/wiki/Q387749","display_name":"Human Connectome Project","level":3,"score":0.4122999906539917},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.40380001068115234},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.4036000072956085},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.3677000105381012},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34769999980926514},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3221000134944916},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3070000112056732},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2752000093460083},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.27160000801086426},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2603999972343445}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03619","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03619","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03619","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03619","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modeling":[0],"long-range":[1],"spatiotemporal":[2,166],"dynamics":[3],"in":[4,114,121],"functional":[5],"Magnetic":[6],"Resonance":[7],"Imaging":[8],"(fMRI)":[9],"remains":[10],"a":[11,58,66,79,89,138,159],"key":[12],"challenge":[13],"due":[14],"to":[15,144],"the":[16,20,100,127,132,149],"high":[17],"dimensionality":[18],"of":[19,82,168],"four-dimensional":[21],"signals.":[22],"Prior":[23],"voxel-based":[24,129],"models,":[25],"although":[26],"demonstrating":[27,118],"excellent":[28],"performance":[29,151],"and":[30,39,107,123,164],"interpretation":[31],"capabilities,":[32],"are":[33],"constrained":[34],"by":[35],"prohibitive":[36],"memory":[37,124],"demands":[38],"thus":[40],"can":[41],"only":[42],"capture":[43],"limited":[44,94],"temporal":[45],"windows.":[46],"To":[47],"address":[48],"this,":[49],"we":[50,136],"propose":[51],"TABLeT":[52,110],"(Two-dimensionally":[53],"Autoencoded":[54],"Brain":[55],"Latent":[56],"Transformer),":[57],"novel":[59],"approach":[60,143,161],"that":[61],"tokenizes":[62],"fMRI":[63,74],"volumes":[64],"using":[65],"pre-trained":[67],"2D":[68],"natural":[69],"image":[70],"autoencoder.":[71],"Each":[72],"3D":[73],"volume":[75],"is":[76,173],"compressed":[77],"into":[78],"compact":[80],"set":[81],"continuous":[83],"tokens,":[84],"enabling":[85],"long-sequence":[86],"modeling":[87,142,167],"with":[88,93],"simple":[90],"Transformer":[91],"encoder":[92],"VRAM.":[95],"Across":[96],"large-scale":[97],"benchmarks":[98],"including":[99],"UK-Biobank":[101],"(UKB),":[102],"Human":[103],"Connectome":[104],"Project":[105],"(HCP),":[106],"ADHD-200":[108],"datasets,":[109],"outperforms":[111],"existing":[112],"models":[113],"multiple":[115],"tasks,":[116],"while":[117],"substantial":[119],"gains":[120],"computational":[122],"efficiency":[125],"over":[126],"state-of-the-art":[128],"method":[130],"given":[131],"same":[133],"input.":[134],"Furthermore,":[135],"develop":[137],"self-supervised":[139],"masked":[140],"token":[141],"pre-train":[145],"TABLeT,":[146],"which":[147],"improves":[148],"model's":[150],"for":[152,162],"various":[153],"downstream":[154],"tasks.":[155],"Our":[156,171],"findings":[157],"suggest":[158],"promising":[160],"scalable":[163],"interpretable":[165],"brain":[169],"activity.":[170],"code":[172],"available":[174],"at":[175],"https://github.com/beotborry/TABLeT.":[176]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-08T00:00:00"}
