{"id":"https://openalex.org/W4416960678","doi":"https://doi.org/10.1109/tpami.2025.3639593","title":"Large-Scale 3D Medical Image Pre-Training With Geometric Context Priors","display_name":"Large-Scale 3D Medical Image Pre-Training With Geometric Context Priors","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W4416960678","doi":"https://doi.org/10.1109/tpami.2025.3639593","pmid":"https://pubmed.ncbi.nlm.nih.gov/41336163"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3639593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3639593","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066318907","display_name":"Linshan Wu","orcid":"https://orcid.org/0000-0002-0486-184X"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Linshan Wu","raw_affiliation_strings":["Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong","Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033396445","display_name":"Jiaxin Zhuang","orcid":"https://orcid.org/0000-0001-9287-4263"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jiaxin Zhuang","raw_affiliation_strings":["Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong","Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, The Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100353596","display_name":"Hao Chen","orcid":"https://orcid.org/0000-0002-8400-3780"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Hao Chen","raw_affiliation_strings":["Department of Computer Science and Engineering, Department of Chemical and Biological Engineering and Division of Life Science, Hong Kong University of Science and Technology, Hong Kong","Department of Computer Science and Engineering, Department of Chemical and Biological Engineering and Division of Life Science, Hong Kong University of Science and Technology, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Department of Chemical and Biological Engineering and Division of Life Science, Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Department of Chemical and Biological Engineering and Division of Life Science, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5066318907"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":4.8723,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.95637867,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"48","issue":"3","first_page":"3801","last_page":"3818"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.24539999663829803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.24539999663829803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.155799999833107,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.13050000369548798,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6362000107765198},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5364999771118164},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.5224000215530396},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.5160999894142151},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.46389999985694885},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4016999900341034},{"id":"https://openalex.org/keywords/medical-diagnosis","display_name":"Medical diagnosis","score":0.38350000977516174},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.3596999943256378},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3522000014781952}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.699400007724762},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6762999892234802},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6362000107765198},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5364999771118164},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.5224000215530396},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.5160999894142151},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.46389999985694885},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44929999113082886},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4016999900341034},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.38350000977516174},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3522000014781952},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.3407000005245209},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.33889999985694885},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3375000059604645},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32170000672340393},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.30140000581741333},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.2854999899864197},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.2847000062465668},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C166704113","wikidata":"https://www.wikidata.org/wiki/Q861092","display_name":"Image registration","level":3,"score":0.2777000069618225},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.2766999900341034},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.25949999690055847},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2538999915122986}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007090","descriptor_name":"Image Interpretation, Computer-Assisted","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D007090","descriptor_name":"Image Interpretation, Computer-Assisted","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D021621","descriptor_name":"Imaging, Three-Dimensional","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D021621","descriptor_name":"Imaging, Three-Dimensional","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1109/tpami.2025.3639593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3639593","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41336163","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41336163","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-167083","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-167083","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3610329574","display_name":null,"funder_award_id":"MHP/002/22","funder_id":"https://openalex.org/F4320324196","funder_display_name":"Innovation and Technology Commission - Hong Kong"},{"id":"https://openalex.org/G7536321984","display_name":null,"funder_award_id":"GHP/006/22GD","funder_id":"https://openalex.org/F4320324196","funder_display_name":"Innovation and Technology Commission - Hong Kong"},{"id":"https://openalex.org/G7914536803","display_name":null,"funder_award_id":"ITS/028/21FP","funder_id":"https://openalex.org/F4320324196","funder_display_name":"Innovation and Technology Commission - Hong Kong"}],"funders":[{"id":"https://openalex.org/F4320324196","display_name":"Innovation and Technology Commission - Hong Kong","ror":"https://ror.org/04vf9tr09"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,54],"scarcity":[1],"of":[2,37,140,235],"annotations":[3],"poses":[4],"a":[5,29,89,101,141,217],"significant":[6],"challenge":[7,56],"in":[8,49,58],"medical":[9,22,50,73,181,213,222],"image":[10,182],"analysis,":[11],"which":[12,86,187],"demands":[13],"extensive":[14],"efforts":[15],"from":[16,122],"radiologists,":[17],"especially":[18],"for":[19,92,112,131,206],"high-dimension":[20],"3D":[21,72],"images.":[23],"Large-scale":[24],"pre-training":[25,44,183],"has":[26],"emerged":[27],"as":[28],"promising":[30,90,238],"label-efficient":[31],"solution,":[32],"owing":[33],"to":[34,88,107,125,148,185,211,240],"the":[35,137,149,158,179,233],"utilization":[36],"large-scale":[38,60],"data,":[39],"large":[40],"models,":[41],"and":[42,63,128,203,228,243,255],"advanced":[43],"techniques.":[45],"However,":[46],"its":[47,146],"development":[48],"images":[51,74],"remains":[52],"underexplored.":[53],"primary":[55],"lies":[57],"harnessing":[59],"unlabeled":[61],"data":[62],"learning":[64,93,168],"high-level":[65,166],"semantics":[66],"without":[67,169],"annotations.":[68,170],"We":[69],"observe":[70],"that":[71],"exhibit":[75],"consistent":[76,80,94],"geometric":[77,81,109,160],"context,":[78],"i.e.,":[79],"relations":[82],"between":[83],"different":[84,123,208],"organs,":[85],"leads":[87],"way":[91],"representations.":[95],"Motivated":[96],"by":[97,144],"this,":[98],"we":[99,118,135,174],"introduce":[100,176],"simple-yet-effective":[102],"Volume":[103],"Contrast":[104],"(VoCo)":[105],"framework":[106],"leverage":[108],"context":[110,161],"priors":[111],"self-supervision.":[113],"Given":[114],"an":[115],"input":[116],"volume,":[117],"extract":[119],"base":[120,150],"crops":[121],"regions":[124],"construct":[126],"positive":[127],"negative":[129],"pairs":[130],"contrastive":[132],"learning.":[133],"Then":[134],"predict":[136],"contextual":[138],"position":[139],"random":[142],"crop":[143],"contrasting":[145],"similarity":[147],"crops.":[151],"In":[152],"this":[153],"way,":[154],"VoCo":[155,245],"implicitly":[156],"encodes":[157],"inherent":[159],"into":[162],"model":[163,209],"representations,":[164],"facilitating":[165],"semantic":[167],"To":[171],"assess":[172],"effectiveness,":[173],"(1)":[175],"PreCT-160":[177],"K,":[178],"largest":[180],"dataset":[184],"date,":[186],"comprises":[188],"160":[189],"K":[190],"Computed":[191],"Tomography":[192],"(CT)":[193],"volumes":[194],"covering":[195],"diverse":[196],"anatomic":[197],"structures;":[198],"(2)":[199],"investigate":[200],"scaling":[201],"laws":[202],"propose":[204],"guidelines":[205],"tailoring":[207],"sizes":[210],"various":[212],"tasks;":[214],"(3)":[215],"build":[216],"comprehensive":[218],"benchmark":[219],"encompassing":[220],"51":[221],"tasks,":[223],"including":[224],"segmentation,":[225],"classification,":[226],"registration,":[227],"vision-language.":[229],"Extensive":[230],"experiments":[231],"highlight":[232],"superiority":[234],"VoCo,":[236],"showcasing":[237],"transferability":[239],"unseen":[241],"modalities":[242],"datasets.":[244],"notably":[246],"enhances":[247],"performance":[248],"on":[249],"datasets":[250],"with":[251],"limited":[252],"labeled":[253],"cases":[254],"significantly":[256],"expedites":[257],"fine-tuning":[258],"convergence.":[259]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-12-03T00:00:00"}
