{"id":"https://openalex.org/W4416017277","doi":"https://doi.org/10.1145/3746252.3760943","title":"MissDDIM: Deterministic and Efficient Conditional Diffusion for Tabular Data Imputation","display_name":"MissDDIM: Deterministic and Efficient Conditional Diffusion for Tabular Data Imputation","publication_year":2025,"publication_date":"2025-11-08","ids":{"openalex":"https://openalex.org/W4416017277","doi":"https://doi.org/10.1145/3746252.3760943"},"language":null,"primary_location":{"id":"doi:10.1145/3746252.3760943","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760943","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746252.3760943","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104278268","display_name":"Youran Zhou","orcid":"https://orcid.org/0009-0001-6831-4634"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Youran Zhou","raw_affiliation_strings":["Deakin University, Geelong, Victoria, Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University, Geelong, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018899731","display_name":"Mohamed Reda Bouadjenek","orcid":"https://orcid.org/0000-0003-1807-430X"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Mohamed Reda Bouadjenek","raw_affiliation_strings":["Deakin University, Geelong, Victoria, Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University, Geelong, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038741954","display_name":"Sunil Aryal","orcid":"https://orcid.org/0000-0002-6639-6824"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Sunil Aryal","raw_affiliation_strings":["Deakin University, Geelong, Victoria, Australia"],"affiliations":[{"raw_affiliation_string":"Deakin University, Geelong, Victoria, Australia","institution_ids":["https://openalex.org/I149704539"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5104278268"],"corresponding_institution_ids":["https://openalex.org/I149704539"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.30507754,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5525","last_page":"5529"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.18799999356269836,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.18799999356269836,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.11129999905824661,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11304","display_name":"Advanced Neuroimaging Techniques and Applications","score":0.09179999679327011,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.7070000171661377},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6643000245094299},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5376999974250793},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5156999826431274},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.4878000020980835},{"id":"https://openalex.org/keywords/importance-sampling","display_name":"Importance sampling","score":0.4343000054359436},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.34549999237060547},{"id":"https://openalex.org/keywords/conditional-probability-distribution","display_name":"Conditional probability distribution","score":0.3343999981880188}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.7070000171661377},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6643000245094299},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6484000086784363},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5376999974250793},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5156999826431274},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4966999888420105},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.4878000020980835},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.47620001435279846},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.4343000054359436},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.34549999237060547},{"id":"https://openalex.org/C43555835","wikidata":"https://www.wikidata.org/wiki/Q2300258","display_name":"Conditional probability distribution","level":2,"score":0.3343999981880188},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3319000005722046},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.33169999718666077},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.3140000104904175},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.30630001425743103},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2840999960899353},{"id":"https://openalex.org/C158424031","wikidata":"https://www.wikidata.org/wiki/Q1191905","display_name":"Gibbs sampling","level":3,"score":0.2718000113964081},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26649999618530273},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.266400009393692},{"id":"https://openalex.org/C17618745","wikidata":"https://www.wikidata.org/wiki/Q207509","display_name":"Copula (linguistics)","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.25940001010894775},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C167723999","wikidata":"https://www.wikidata.org/wiki/Q3773214","display_name":"Sampling distribution","level":2,"score":0.2551000118255615}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3746252.3760943","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760943","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},{"id":"pmh:oai:figshare.com:article/30631955","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference contribution"}],"best_oa_location":{"id":"doi:10.1145/3746252.3760943","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3760943","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1966503970","https://openalex.org/W1970059922","https://openalex.org/W1976364950","https://openalex.org/W2064186732","https://openalex.org/W2966501701","https://openalex.org/W3035623224","https://openalex.org/W3043579284","https://openalex.org/W3216660278","https://openalex.org/W4360884927","https://openalex.org/W4382202969","https://openalex.org/W4386075858","https://openalex.org/W4388914362","https://openalex.org/W4390872583","https://openalex.org/W4400436554"],"related_works":[],"abstract_inverted_index":{"Diffusion":[0,66],"models":[1,32],"have":[2],"recently":[3],"emerged":[4],"as":[5],"powerful":[6],"tools":[7],"for":[8,70,163],"missing":[9],"data":[10],"imputation":[11,118,165],"by":[12],"modeling":[13],"the":[14,141,157],"joint":[15],"distribution":[16],"of":[17,143,160],"observed":[18,121,128],"and":[19,39,99,152],"unobserved":[20],"variables.":[21],"However,":[22],"existing":[23],"methods,":[24],"typically":[25],"based":[26],"on":[27,131],"stochastic":[28,74],"denoising":[29],"diffusion":[30,61,145,162],"probabilistic":[31],"(DDPMs),":[33],"suffer":[34],"from":[35,120],"high":[36],"inference":[37,150],"latency":[38],"variable":[40],"outputs,":[41],"limiting":[42],"their":[43],"applicability":[44],"in":[45,55],"real-world":[46,164],"tabular":[47,71],"settings.":[48],"To":[49,103],"address":[50],"these":[51],"deficiencies,":[52],"we":[53,110],"present":[54],"this":[56,90],"paper":[57],"MissDDIM,":[58],"a":[59,92,112],"conditional":[60],"framework":[62],"that":[63,84,115,136],"adapts":[64],"Denoising":[65],"Implicit":[67],"Models":[68],"(DDIM)":[69],"imputation.":[72],"While":[73],"sampling":[75,95],"enables":[76],"diverse":[77],"completions,":[78],"it":[79],"also":[80],"introduces":[81],"output":[82],"variability":[83],"complicates":[85],"downstream":[86],"processing.":[87],"MissDDIM":[88,137],"replaces":[89],"with":[91],"deterministic,":[93],"non-Markovian":[94],"path,":[96],"yielding":[97],"faster":[98],"more":[100],"consistent":[101],"imputations.":[102],"better":[104],"leverage":[105],"incomplete":[106],"inputs":[107],"during":[108],"training,":[109],"introduce":[111],"self-masking":[113],"strategy":[114],"dynamically":[116],"constructs":[117],"targets":[119],"features-enabling":[122],"robust":[123],"conditioning":[124],"without":[125],"requiring":[126],"fully":[127],"data.":[129],"Experiments":[130],"five":[132],"benchmark":[133],"datasets":[134],"demonstrate":[135],"matches":[138],"or":[139],"exceeds":[140],"accuracy":[142],"state-of-the-art":[144],"models,":[146],"while":[147],"significantly":[148],"improving":[149],"speed":[151],"stability.":[153],"These":[154],"results":[155],"highlight":[156],"practical":[158],"value":[159],"deterministic":[161],"tasks.":[166]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-11-08T00:00:00"}
