{"id":"https://openalex.org/W7139035611","doi":"https://doi.org/10.48550/arxiv.2603.15980","title":"Standardizing Medical Images at Scale for AI","display_name":"Standardizing Medical Images at Scale for AI","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7139035611","doi":"https://doi.org/10.48550/arxiv.2603.15980"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15980","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064828254","display_name":"Callen MacPhee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"MacPhee, Callen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129822293","display_name":"Yiming Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059003896","display_name":"Koichiro Kishima","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kishima, Koichiro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5057807483","display_name":"Bahram Jalali","orcid":"https://orcid.org/0000-0002-0169-8231"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jalali, Bahram","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.3149000108242035,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10862","display_name":"AI in cancer detection","score":0.3149000108242035,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11897","display_name":"Digital Holography and Microscopy","score":0.2184000015258789,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11183","display_name":"Advanced X-ray Imaging Techniques","score":0.07129999995231628,"subfield":{"id":"https://openalex.org/subfields/3108","display_name":"Radiation"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.8050000071525574},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5152000188827515},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5076000094413757},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5040000081062317},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4918999969959259},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4641000032424927},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.4609000086784363},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4447999894618988},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4433000087738037}],"concepts":[{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.8050000071525574},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7146999835968018},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6661999821662903},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5152000188827515},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5076000094413757},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5040000081062317},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4918999969959259},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4641000032424927},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.4609000086784363},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4481000006198883},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4447999894618988},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4433000087738037},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42570000886917114},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3662000000476837},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31139999628067017},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.29249998927116394},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.29190000891685486},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.289900004863739},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C2781195486","wikidata":"https://www.wikidata.org/wiki/Q289436","display_name":"Texture (cosmology)","level":3,"score":0.2879999876022339},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C123614077","wikidata":"https://www.wikidata.org/wiki/Q1364905","display_name":"Propagation of uncertainty","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2655999958515167},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.25690001249313354},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.2517000138759613},{"id":"https://openalex.org/C163985040","wikidata":"https://www.wikidata.org/wiki/Q1172399","display_name":"Data acquisition","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deep":[0],"learning":[1],"has":[2],"achieved":[3],"remarkable":[4],"success":[5],"in":[6,23,191],"medical":[7,61,177],"image":[8],"analysis,":[9],"yet":[10],"its":[11],"performance":[12],"remains":[13],"highly":[14],"sensitive":[15],"to":[16,111,131],"the":[17,51,115,145],"heterogeneity":[18],"of":[19,57],"clinical":[20,192],"data.":[21],"Differences":[22],"imaging":[24],"hardware,":[25],"staining":[26],"protocols,":[27],"and":[28,98,106,137,151,189],"acquisition":[29],"conditions":[30],"produce":[31],"substantial":[32],"domain":[33],"shifts":[34],"that":[35,79,179],"degrade":[36],"model":[37],"generalization":[38],"across":[39],"institutions.":[40],"Here":[41],"we":[42],"present":[43],"a":[44,81,158,172],"physics-based":[45],"data":[46,174],"preprocessing":[47,119,160],"framework":[48,71],"based":[49],"on":[50],"PhyCV":[52,118,170],"(Physics-Inspired":[53],"Computer":[54],"Vision)":[55],"family":[56],"algorithms,":[58],"which":[59],"standardizes":[60],"images":[62,73,113],"through":[63,183],"deterministic":[64],"transformations":[65],"derived":[66],"from":[67,114,125],"optical":[68,77],"physics.":[69],"The":[70],"models":[72],"as":[74,96,157,171],"spatially":[75],"varying":[76],"fields":[78],"undergo":[80],"virtual":[82],"diffractive":[83],"propagation":[84],"followed":[85],"by":[86],"coherent":[87],"phase":[88],"detection.":[89],"This":[90],"process":[91],"suppresses":[92],"non-semantic":[93],"variability":[94],"such":[95],"color":[97],"illumination":[99],"differences":[100],"while":[101],"preserving":[102],"diagnostically":[103],"relevant":[104],"texture":[105],"structural":[107],"features.":[108],"When":[109],"applied":[110],"histopathological":[112],"Camelyon17-WILDS":[116],"benchmark,":[117],"improves":[120],"out-of-distribution":[121],"breast-cancer":[122],"classification":[123],"accuracy":[124],"70.8%":[126],"(Empirical":[127],"Risk":[128],"Minimization":[129],"baseline)":[130],"90.9%,":[132],"matching":[133],"or":[134,162],"exceeding":[135],"data-augmentation":[136],"domain-generalization":[138],"approaches":[139],"at":[140],"negligible":[141],"computational":[142],"cost.":[143],"Because":[144],"transform":[146],"is":[147],"physically":[148],"interpretable,":[149],"parameterizable,":[150],"differentiable,":[152],"it":[153],"can":[154],"be":[155],"deployed":[156],"fixed":[159],"stage":[161],"integrated":[163],"into":[164],"end-to-end":[165],"learning.":[166],"These":[167],"results":[168],"establish":[169],"generalizable":[173],"refinery":[175],"for":[176],"imaging-one":[178],"harmonizes":[180],"heterogeneous":[181],"datasets":[182],"first-principles":[184],"physics,":[185],"improving":[186],"robustness,":[187],"interpretability,":[188],"reproducibility":[190],"AI":[193],"systems.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-20T00:00:00"}
