{"id":"https://openalex.org/W4414267126","doi":"https://doi.org/10.14778/3750601.3750667","title":"TARImpute: Task-Aware Auto-Recommender System for Missing Value Imputation Algorithms with Clustering Case Studies","display_name":"TARImpute: Task-Aware Auto-Recommender System for Missing Value Imputation Algorithms with Clustering Case Studies","publication_year":2025,"publication_date":"2025-08-01","ids":{"openalex":"https://openalex.org/W4414267126","doi":"https://doi.org/10.14778/3750601.3750667"},"language":"en","primary_location":{"id":"doi:10.14778/3750601.3750667","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3750601.3750667","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035726597","display_name":"Xiaoou Ding","orcid":"https://orcid.org/0000-0002-9426-1820"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoou Ding","raw_affiliation_strings":["Harbin Institute of Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047882464","display_name":"Yanshuo Liu","orcid":"https://orcid.org/0000-0002-2916-8339"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanshuo Liu","raw_affiliation_strings":["Harbin Institute of Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057666135","display_name":"Zhounan Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhounan Chen","raw_affiliation_strings":["Harbin Institute of Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100396644","display_name":"Hongzhi Wang","orcid":"https://orcid.org/0000-0002-4097-8703"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongzhi Wang","raw_affiliation_strings":["Harbin Institute of Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100337643","display_name":"Chen Wang","orcid":"https://orcid.org/0000-0003-0204-2362"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Wang","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5115591736","display_name":"Jianmin Wang","orcid":"https://orcid.org/0009-0008-2668-0047"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianmin Wang","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11622431,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"18","issue":"12","first_page":"5343","last_page":"5346"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.8632000088691711},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7200000286102295},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.6420000195503235},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4004000127315521},{"id":"https://openalex.org/keywords/propagation-of-uncertainty","display_name":"Propagation of uncertainty","score":0.27900001406669617}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.8632000088691711},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7200000286102295},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6880999803543091},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6488999724388123},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.6420000195503235},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4004000127315521},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3828999996185303},{"id":"https://openalex.org/C123614077","wikidata":"https://www.wikidata.org/wiki/Q1364905","display_name":"Propagation of uncertainty","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C111442797","wikidata":"https://www.wikidata.org/wiki/Q7291446","display_name":"Rand index","level":3,"score":0.2635999917984009},{"id":"https://openalex.org/C2779714256","wikidata":"https://www.wikidata.org/wiki/Q25305062","display_name":"Multiple Models","level":2,"score":0.26249998807907104}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3750601.3750667","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3750601.3750667","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W2953048192","https://openalex.org/W3006419771","https://openalex.org/W4283070713","https://openalex.org/W4293210185","https://openalex.org/W4320030233","https://openalex.org/W4400909535","https://openalex.org/W4404181119"],"related_works":[],"abstract_inverted_index":{"Missing":[0],"data":[1,7,119],"prevalent":[2],"in":[3],"information":[4],"systems":[5],"impacts":[6],"diversity":[8],"and":[9,20,88,120],"fidelity,":[10],"which":[11],"systematically":[12],"degrade":[13],"clustering":[14,109],"performance":[15],"through":[16],"biased":[17],"similarity":[18],"measures":[19],"unstable":[21],"cluster":[22],"boundaries.":[23],"Current":[24],"large-scale":[25],"environments":[26],"lack":[27],"standardized":[28],"imputation-clustering":[29,76],"pipelines,":[30],"as":[31],"existing":[32],"methods":[33,103],"operate":[34],"independently":[35],"of":[36,75,84,95],"downstream":[37],"tasks":[38],"without":[39],"analyzing":[40],"error":[41,86],"propagation":[42],"effects,":[43],"leading":[44],"to":[45,104,123],"unreliable":[46],"results.":[47],"To":[48],"address":[49],"this,":[50],"we":[51],"propose":[52],"TARImpute,":[53],"a":[54],"Task-Aware":[55],"auto-Recommender":[56],"system":[57],"for":[58,62,72,92,117],"missing":[59],"value":[60],"imputation":[61,85,97,102],"clustering.":[63],"It":[64],"owns":[65],"three":[66],"integrated":[67],"features:":[68],"Imputation":[69],"Impact":[70],"Profiler":[71],"quantitative":[73],"evaluation":[74],"interactions,":[77],"Error":[78],"Propagation":[79],"Interpreter":[80],"enabling":[81],"explainable":[82],"modeling":[83],"diffusion,":[87],"Adaptive":[89],"Strategy":[90],"Optimizer":[91],"dynamic":[93],"selection":[94],"optimal":[96],"methods.":[98],"TARImpute":[99,111],"provides":[100,113],"state-of-the-art":[101],"evaluate":[105],"their":[106],"effects":[107],"on":[108],"tasks.":[110,126],"also":[112],"robust,":[114],"interpretable":[115],"solutions":[116],"low-quality":[118],"shows":[121],"extensibility":[122],"other":[124],"analytical":[125]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
