{"id":"https://openalex.org/W7133336379","doi":"https://doi.org/10.48550/arxiv.2603.00979","title":"Fake It Right: Injecting Anatomical Logic into Synthetic Supervised Pre-training for Medical Segmentation","display_name":"Fake It Right: Injecting Anatomical Logic into Synthetic Supervised Pre-training for Medical Segmentation","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133336379","doi":"https://doi.org/10.48550/arxiv.2603.00979"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00979","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00979","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00979","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121095427","display_name":"Jiaqi Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Jiaqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127970461","display_name":"Mengyan Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Mengyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128029699","display_name":"Shu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022828476","display_name":"Fandong Zhang","orcid":"https://orcid.org/0000-0003-0655-1180"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Fandong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127982634","display_name":"Qingchao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Qingchao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5328999757766724,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5328999757766724,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14510","display_name":"Medical Imaging and Analysis","score":0.07400000095367432,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.061900001019239426,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7164999842643738},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6952000260353088},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.5497999787330627},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4772999882698059},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.46810001134872437},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3930000066757202},{"id":"https://openalex.org/keywords/image-synthesis","display_name":"Image synthesis","score":0.383899986743927},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.37630000710487366},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.35929998755455017}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8093000054359436},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7164999842643738},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6952000260353088},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.633899986743927},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.5497999787330627},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4772999882698059},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.46810001134872437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.454800009727478},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3930000066757202},{"id":"https://openalex.org/C2989087649","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Image synthesis","level":3,"score":0.383899986743927},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.35929998755455017},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3587999939918518},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.33329999446868896},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32199999690055847},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.31369999051094055},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.30799999833106995},{"id":"https://openalex.org/C58973888","wikidata":"https://www.wikidata.org/wiki/Q1041418","display_name":"Semi-supervised learning","level":2,"score":0.29440000653266907},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2858999967575073},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.28040000796318054},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2793000042438507},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2732999920845032},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26570001244544983},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.2554999887943268},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2529999911785126},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00979","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00979","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00979","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00979","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision":[0],"Transformers":[1],"(ViTs)":[2],"excel":[3],"in":[4],"3D":[5],"medical":[6,197],"segmentation":[7,106],"but":[8],"require":[9],"massive":[10],"annotated":[11],"datasets.":[12],"While":[13],"Self-Supervised":[14],"Learning":[15,32],"(SSL)":[16],"mitigates":[17],"this":[18,77],"using":[19,133],"unlabeled":[20],"data,":[21],"it":[22],"still":[23],"faces":[24],"strict":[25],"privacy":[26],"and":[27,61,139,155,167,172],"logistical":[28],"barriers.":[29],"Formula-Driven":[30],"Supervised":[31,84],"(FDSL)":[33],"offers":[34],"a":[35,45,99,114,140,178,192],"privacy-preserving":[36],"alternative":[37],"by":[38,170],"pre-training":[39],"on":[40,153],"synthetic":[41,187],"mathematical":[42],"primitives.":[43],"However,":[44],"critical":[46],"semantic":[47],"gap":[48],"limits":[49],"its":[50],"efficacy:":[51],"generic":[52],"shapes":[53],"lack":[54],"the":[55,121],"morphological":[56],"fidelity,":[57],"fixed":[58],"spatial":[59,134],"layouts,":[60],"inter-organ":[62,145],"relationships":[63],"of":[64,126],"real":[65],"anatomy,":[66],"preventing":[67,148],"models":[68],"from":[69,108],"learning":[70],"essential":[71],"global":[72],"structural":[73],"priors.":[74],"To":[75],"bridge":[76],"gap,":[78],"we":[79,112,129],"propose":[80],"an":[81],"Anatomy-Informed":[82],"Synthetic":[83],"Pre-training":[85],"framework":[86],"unifying":[87],"FDSL's":[88],"infinite":[89],"scalability":[90],"with":[91,98,103,185],"anatomical":[92],"realism.":[93],"We":[94],"replace":[95],"basic":[96],"primitives":[97],"lightweight":[100],"shape":[101],"bank":[102],"de-identified,":[104],"label-only":[105],"masks":[107],"5":[109],"subjects.":[110],"Furthermore,":[111],"introduce":[113],"structure-aware":[115],"sequential":[116],"placement":[117],"strategy":[118],"to":[119,143,174],"govern":[120],"patch":[122],"synthesis":[123],"process.":[124],"Instead":[125],"random":[127],"placement,":[128],"enforce":[130],"physiological":[131],"plausibility":[132],"anchors":[135],"for":[136,196],"correct":[137],"localization":[138],"topological":[141],"graph":[142],"manage":[144],"interactions":[146],"(e.g.,":[147],"impossible":[149],"overlaps).":[150],"Extensive":[151],"experiments":[152],"BTCV":[154],"MSD":[156],"datasets":[157],"demonstrate":[158],"that":[159],"our":[160],"method":[161],"significantly":[162],"outperforms":[163],"state-of-the-art":[164],"FDSL":[165],"baselines":[166],"SSL":[168],"methods":[169],"1.74\\%":[171],"up":[173],"1.66\\%,":[175],"while":[176],"exhibiting":[177],"robust":[179],"scaling":[180],"effect":[181],"where":[182],"performance":[183],"improves":[184],"increased":[186],"data":[188],"volume.":[189],"This":[190],"provides":[191],"data-efficient,":[193],"privacy-compliant":[194],"solution":[195],"segmentation.":[198],"The":[199],"code":[200],"will":[201],"be":[202],"made":[203],"publicly":[204],"available":[205],"upon":[206],"acceptance.":[207]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-04T00:00:00"}
