{"id":"https://openalex.org/W4416078506","doi":"https://doi.org/10.1145/3746252.3760875","title":"Rethinking Masked Image Modeling for Ultrasound Image Denoising","display_name":"Rethinking Masked Image Modeling for Ultrasound Image Denoising","publication_year":2025,"publication_date":"2025-11-10","ids":{"openalex":"https://openalex.org/W4416078506","doi":"https://doi.org/10.1145/3746252.3760875"},"language":null,"primary_location":{"id":"doi:10.1145/3746252.3760875","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760875","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746252.3760875","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009598097","display_name":"Yuchong Yao","orcid":"https://orcid.org/0000-0001-8368-4978"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Yuchong Yao","raw_affiliation_strings":["The University of Melbourne, Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Melbourne, Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031865298","display_name":"Nandakishor Desai","orcid":"https://orcid.org/0000-0001-6491-6171"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Nandakishor Desai","raw_affiliation_strings":["The University of Melbourne, Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Melbourne, Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080554686","display_name":"Marimuthu Palaniswami","orcid":"https://orcid.org/0000-0002-3635-4252"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Marimuthu Palaniswami","raw_affiliation_strings":["The University of Melbourne, Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Melbourne, Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009598097"],"corresponding_institution_ids":["https://openalex.org/I165779595"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36285256,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5428","last_page":"5432"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.5835000276565552,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.5835000276565552,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10727","display_name":"Ultrasound Imaging and Elastography","score":0.24529999494552612,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12419","display_name":"Phonocardiography and Auscultation Techniques","score":0.012500000186264515,"subfield":{"id":"https://openalex.org/subfields/2740","display_name":"Pulmonary and Respiratory Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.6518999934196472},{"id":"https://openalex.org/keywords/speckle-noise","display_name":"Speckle noise","score":0.5898000001907349},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4505000114440918},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4189000129699707},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4075999855995178},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.3801000118255615},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.35659998655319214},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.3522999882698059}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7753000259399414},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7422000169754028},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.6518999934196472},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5899999737739563},{"id":"https://openalex.org/C180940675","wikidata":"https://www.wikidata.org/wiki/Q7575045","display_name":"Speckle noise","level":3,"score":0.5898000001907349},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4505000114440918},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4189000129699707},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4075999855995178},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.3801000118255615},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3522999882698059},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C102290492","wikidata":"https://www.wikidata.org/wiki/Q7575045","display_name":"Speckle pattern","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.29010000824928284},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C101453961","wikidata":"https://www.wikidata.org/wiki/Q7048948","display_name":"Non-local means","level":4,"score":0.26570001244544983},{"id":"https://openalex.org/C35772409","wikidata":"https://www.wikidata.org/wiki/Q1323086","display_name":"Image noise","level":3,"score":0.2603999972343445},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746252.3760875","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760875","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3746252.3760875","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760875","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2056370875","https://openalex.org/W2099244020","https://openalex.org/W2113945798","https://openalex.org/W2194775991","https://openalex.org/W2764207251","https://openalex.org/W2913559493","https://openalex.org/W2962785568","https://openalex.org/W2965900506","https://openalex.org/W2971649496","https://openalex.org/W3035524453","https://openalex.org/W3120430728","https://openalex.org/W3159481202","https://openalex.org/W3167568784","https://openalex.org/W4225672218","https://openalex.org/W4312812783","https://openalex.org/W4313156423","https://openalex.org/W4386083093","https://openalex.org/W4387740865","https://openalex.org/W4392694038","https://openalex.org/W4393038802","https://openalex.org/W4400231909","https://openalex.org/W4402952320"],"related_works":[],"abstract_inverted_index":{"Ultrasound":[0],"imaging":[1],"serves":[2],"as":[3,166],"an":[4],"important":[5,44],"clinical":[6,30],"diagnostic":[7,27,45],"modality":[8],"due":[9,62,98],"to":[10,60,63,99],"its":[11,100],"non-invasive,":[12],"radiation-free,":[13],"and":[14,29,66,103,133],"real-time":[15],"capabilities.":[16],"However,":[17],"ultrasound":[18,122],"images":[19],"suffer":[20],"from":[21],"speckle":[22,38],"noise":[23,139,183],"that":[24,57],"significantly":[25],"compromises":[26],"accuracy":[28],"interpretation.":[31],"Traditional":[32],"denoising":[33,97,158],"methods":[34],"are":[35,58],"limited":[36],"by":[37],"noise's":[39],"signal-dependent":[40],"nature,":[41],"often":[42],"removing":[43],"features.":[46],"While":[47],"deep":[48],"learning":[49,70,104,136],"performs":[50,157],"better,":[51],"it":[52],"requires":[53],"large":[54],"labelled":[55],"datasets":[56],"difficult":[59],"obtain":[61],"privacy":[64],"concerns":[65],"annotation":[67],"costs.":[68],"Self-supervised":[69],"through":[71],"masked":[72],"image":[73,96,123],"modeling":[74],"(MIM)":[75],"shows":[76],"potential":[77],"in":[78,167],"addressing":[79],"data":[80],"scarcity,":[81],"but":[82],"conventional":[83,168],"MIM,":[84],"developed":[85],"for":[86,92,121,138],"high-level":[87],"vision":[88],"tasks,":[89],"is":[90],"unsuitable":[91],"low-level":[93],"tasks":[94],"like":[95],"framework":[101,120,180],"architecture":[102,143],"strategy.":[105],"To":[106],"this":[107],"end,":[108],"we":[109],"propose":[110],"Image":[111,114],"Denoising":[112],"Masked":[113],"Modeling":[115],"(ID-MIM),":[116],"the":[117,154,174],"first":[118],"MIM":[119,169],"denoising.":[124],"ID-MIM":[125,179],"incorporates":[126],"a":[127,134,145],"novel":[128],"high-frequency":[129],"oriented":[130],"dual-branch":[131],"masking":[132],"specialized":[135],"objective":[137],"reduction.":[140],"Our":[141],"encoder-only":[142],"features":[144],"multi-scale":[146],"hierarchical":[147],"transformer":[148],"with":[149],"dynamic":[150],"skip":[151],"connections,":[152],"where":[153],"encoder":[155],"directly":[156],"rather":[159],"than":[160],"relying":[161],"on":[162],"separate":[163],"decoder":[164],"reconstruction":[165],"approaches.":[170],"Extensive":[171],"experiments":[172],"demonstrate":[173],"superior":[175],"performance":[176],"of":[177],"our":[178],"across":[181],"diverse":[182],"scenarios,":[184],"establishing":[185],"new":[186],"state-of-the-art":[187],"results.":[188]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-10T00:00:00"}
