{"id":"https://openalex.org/W7148519297","doi":"https://doi.org/10.48550/arxiv.2604.00514","title":"MAESIL: Masked Autoencoder for Enhanced Self-supervised Medical Image Learning","display_name":"MAESIL: Masked Autoencoder for Enhanced Self-supervised Medical Image Learning","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148519297","doi":"https://doi.org/10.48550/arxiv.2604.00514"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00514","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00514","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00514","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126342227","display_name":"Kyeonghun Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Kyeonghun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046000978","display_name":"Hyeonseok Jung","orcid":"https://orcid.org/0000-0001-8902-9624"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung, Hyeonseok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132808103","display_name":"Youngung Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Youngung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032091387","display_name":"Junsu Lim","orcid":"https://orcid.org/0000-0002-8585-5686"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lim, Junsu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126305680","display_name":"Yeonju Jean","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jean, YeonJu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126305126","display_name":"Seongbin Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Seongbin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126336636","display_name":"Eunseob Choi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Eunseob","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126322351","display_name":"Hyunsu Go","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Go, Hyunsu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073034437","display_name":"Seoyoung Ju","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ju, SeoYoung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132807243","display_name":"Seohyoung Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Seohyoung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132793441","display_name":"Gyeongmin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Gyeongmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126344029","display_name":"Minju Kwon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, MinJu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126324608","display_name":"Kyungseok Yuh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuh, KyungSeok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132812384","display_name":"Soo Yong Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Soo Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028602586","display_name":"Ken Ying-Kai Liao","orcid":"https://orcid.org/0000-0001-7815-8199"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Ken Ying-Kai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132816820","display_name":"Nam-Joon Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Nam-Joon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132830650","display_name":"Hyuk-Jae Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Hyuk-Jae","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.5181000232696533,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.5181000232696533,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1216999962925911,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.05290000140666962,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.8148000240325928},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6248000264167786},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5770999789237976},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5339999794960022},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.520799994468689},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.5188000202178955},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4187999963760376},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4027999937534332},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.3968000113964081}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.8148000240325928},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7457000017166138},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7125999927520752},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6248000264167786},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5770999789237976},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5339999794960022},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.520799994468689},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.5188000202178955},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45489999651908875},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4187999963760376},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3968000113964081},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3815000057220459},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.37130001187324524},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.36660000681877136},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.3578000068664551},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.34769999980926514},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.34610000252723694},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C58973888","wikidata":"https://www.wikidata.org/wiki/Q1041418","display_name":"Semi-supervised learning","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C544519230","wikidata":"https://www.wikidata.org/wiki/Q32566","display_name":"Computed tomography","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.25780001282691956}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00514","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00514","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00514","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00514","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.6548252105712891,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Training":[0],"deep":[1],"learning":[2,109],"models":[3],"for":[4,100,208],"three-dimensional":[5],"(3D)":[6],"medical":[7,44,103,210],"imaging,":[8],"such":[9,183,193],"as":[10,48,72,184,194,201],"Computed":[11],"Tomography":[12],"(CT),":[13],"is":[14,28,121],"fundamentally":[15,82],"challenged":[16],"by":[17],"the":[18,59,88,98,122,140],"scarcity":[19],"of":[20,63,75],"labeled":[21],"data.":[22],"While":[23],"pre-training":[24,206],"on":[25,42,164],"natural":[26],"images":[27],"common,":[29],"it":[30],"results":[31,173],"in":[32,189],"a":[33,49,73,106,124,146,152,202],"significant":[34,178],"domain":[35],"shift,":[36],"limiting":[37],"performance.":[38],"Self-Supervised":[39],"Learning":[40],"(SSL)":[41],"unlabeled":[43],"data":[45],"has":[46],"emerged":[47],"powerful":[50],"solution,":[51],"but":[52],"prominent":[53],"frameworks":[54],"often":[55],"fail":[56],"to":[57,112,155],"exploit":[58],"inherent":[60],"3D":[61,70,89,114,125,131,147,209],"nature":[62],"CT":[64,169],"scans.":[65],"These":[66],"methods":[67,182],"typically":[68],"process":[69],"scans":[71],"collection":[74],"independent":[76],"2D":[77],"slices,":[78],"an":[79],"approach":[80,163],"that":[81,129,175],"discards":[83],"critical":[84],"axial":[85],"coherence":[86],"and":[87,144,187,196,204],"structural":[90,115],"context.":[91],"To":[92],"address":[93],"this":[94],"limitation,":[95],"we":[96],"propose":[97],"autoencoder":[99,149],"enhanced":[101],"self-supervised":[102,108],"image":[104],"learning(MAESIL),":[105],"novel":[107],"framework":[110,138],"designed":[111],"capture":[113],"information":[116],"efficiently.":[117],"The":[118],"core":[119],"innovation":[120],"'superpatch',":[123],"chunk-based":[126],"input":[127],"unit":[128],"balances":[130],"context":[132],"preservation":[133],"with":[134,151],"computational":[135],"efficiency.":[136],"Our":[137,171],"partitions":[139],"volume":[141],"into":[142],"superpatches":[143],"employs":[145],"masked":[148],"strategy":[150,154],"dual-masking":[153],"learn":[156],"comprehensive":[157],"spatial":[158],"representations.":[159],"We":[160],"validated":[161],"our":[162],"three":[165],"diverse":[166],"large-scale":[167],"public":[168],"datasets.":[170],"experimental":[172],"show":[174],"MAESIL":[176,200],"demonstrates":[177],"improvements":[179],"over":[180],"existing":[181],"AE,":[185],"VAE":[186],"VQ-VAE":[188],"key":[190],"reconstruction":[191],"metrics":[192],"PSNR":[195],"SSIM.":[197],"This":[198],"establishes":[199],"robust":[203],"practical":[205],"solution":[207],"imaging":[211],"tasks.":[212]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-03T00:00:00"}
