{"id":"https://openalex.org/W4399174541","doi":"https://doi.org/10.1145/3654929","title":"Certain and Approximately Certain Models for Statistical Learning","display_name":"Certain and Approximately Certain Models for Statistical Learning","publication_year":2024,"publication_date":"2024-05-29","ids":{"openalex":"https://openalex.org/W4399174541","doi":"https://doi.org/10.1145/3654929"},"language":"en","primary_location":{"id":"doi:10.1145/3654929","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654929","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654929","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3654929","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031301229","display_name":"Cheng Zhen","orcid":"https://orcid.org/0009-0001-0560-8926"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Cheng Zhen","raw_affiliation_strings":["Oregon State University, Corvallis, USA"],"raw_orcid":"https://orcid.org/0009-0001-0560-8926","affiliations":[{"raw_affiliation_string":"Oregon State University, Corvallis, USA","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093524857","display_name":"Nischal Aryal","orcid":"https://orcid.org/0009-0006-9673-9492"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nischal Aryal","raw_affiliation_strings":["Oregon State University, Corvallis, USA"],"raw_orcid":"https://orcid.org/0009-0006-9673-9492","affiliations":[{"raw_affiliation_string":"Oregon State University, Corvallis, USA","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008664449","display_name":"Arash Termehchy","orcid":"https://orcid.org/0009-0007-2213-6303"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arash Termehchy","raw_affiliation_strings":["Oregon State University, Corvallis, USA"],"raw_orcid":"https://orcid.org/0009-0007-2213-6303","affiliations":[{"raw_affiliation_string":"Oregon State University, Corvallis, USA","institution_ids":["https://openalex.org/I131249849"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081520030","display_name":"Amandeep Singh Chabada","orcid":"https://orcid.org/0009-0008-5435-0598"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amandeep Singh Chabada","raw_affiliation_strings":["Oregon State University, Corvallis, USA"],"raw_orcid":"https://orcid.org/0009-0008-5435-0598","affiliations":[{"raw_affiliation_string":"Oregon State University, Corvallis, USA","institution_ids":["https://openalex.org/I131249849"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5031301229"],"corresponding_institution_ids":["https://openalex.org/I131249849"],"apc_list":null,"apc_paid":null,"fwci":0.6623,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.73087886,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"2","issue":"3","first_page":"1","last_page":"25"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.8679847717285156},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8090270757675171},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.7924361228942871},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5566838979721069},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5394810438156128},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46222934126853943},{"id":"https://openalex.org/keywords/real-world-data","display_name":"Real world data","score":0.45870599150657654},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.1319105625152588}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.8679847717285156},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8090270757675171},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.7924361228942871},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5566838979721069},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5394810438156128},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46222934126853943},{"id":"https://openalex.org/C3020493868","wikidata":"https://www.wikidata.org/wiki/Q55631277","display_name":"Real world data","level":2,"score":0.45870599150657654},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.1319105625152588}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3654929","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654929","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654929","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3654929","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3654929","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3654929","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399174541.pdf"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W2132862423","https://openalex.org/W2480680997","https://openalex.org/W2548122763","https://openalex.org/W2809993608","https://openalex.org/W3029062663","https://openalex.org/W3033623677","https://openalex.org/W3147796863","https://openalex.org/W4221143014","https://openalex.org/W4381329328","https://openalex.org/W6926378856","https://openalex.org/W6945233569","https://openalex.org/W6959643953"],"related_works":["https://openalex.org/W2181530120","https://openalex.org/W4211215373","https://openalex.org/W2024529227","https://openalex.org/W2055961818","https://openalex.org/W1574575415","https://openalex.org/W3144172081","https://openalex.org/W3179858851","https://openalex.org/W3028371478","https://openalex.org/W2081476516","https://openalex.org/W2581984549"],"abstract_inverted_index":{"Real-world":[0],"data":[1,34,51,58,72,123],"is":[2,43,103],"often":[3],"incomplete":[4],"and":[5,25,28,59,95,119],"contains":[6],"missing":[7,33,53],"values.":[8],"To":[9],"train":[10],"accurate":[11,47,76,97],"models":[12,48,77,98],"over":[13],"real-world":[14],"datasets,":[15],"users":[16],"need":[17],"to":[18,45,74,91],"spend":[19],"a":[20,64],"substantial":[21],"amount":[22,116],"of":[23,71,117],"time":[24,118],"resources":[26],"imputing":[27],"finding":[29],"proper":[30],"values":[31,54],"for":[32,55,67,122],"items.":[35],"In":[36],"this":[37,93],"paper,":[38],"we":[39],"demonstrate":[40],"that":[41,109],"it":[42],"possible":[44],"learn":[46,75],"directly":[49],"from":[50],"with":[52,88],"certain":[56],"training":[57],"target":[60],"models.":[61],"We":[62,84],"propose":[63],"unified":[65],"approach":[66],"checking":[68],"the":[69,115],"necessity":[70,94],"imputation":[73,102,124],"across":[78],"various":[79],"widely-used":[80],"machine":[81],"learning":[82],"paradigms.":[83],"build":[85],"efficient":[86],"algorithms":[87,112],"theoretical":[89],"guarantees":[90],"check":[92],"return":[96],"in":[99],"cases":[100],"where":[101],"unnecessary.":[104],"Our":[105],"extensive":[106],"experiments":[107],"indicate":[108],"our":[110],"proposed":[111],"significantly":[113],"reduce":[114],"effort":[120],"needed":[121],"without":[125],"imposing":[126],"considerable":[127],"computational":[128],"overhead.":[129]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
