{"id":"https://openalex.org/W4417317650","doi":"https://doi.org/10.3390/bdcc9120321","title":"A Tabular Data Imputation Technique Using Transformer and Convolutional Neural Networks","display_name":"A Tabular Data Imputation Technique Using Transformer and Convolutional Neural Networks","publication_year":2025,"publication_date":"2025-12-13","ids":{"openalex":"https://openalex.org/W4417317650","doi":"https://doi.org/10.3390/bdcc9120321"},"language":"en","primary_location":{"id":"doi:10.3390/bdcc9120321","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120321","pdf_url":"https://www.mdpi.com/2504-2289/9/12/321/pdf?version=1765621033","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-2289/9/12/321/pdf?version=1765621033","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071421433","display_name":"Charl\u00e8ne B\u00e9atrice Bridge-Nduwimana","orcid":"https://orcid.org/0000-0002-4505-3224"},"institutions":[{"id":"https://openalex.org/I81605866","display_name":"Sidi Mohamed Ben Abdellah University","ror":"https://ror.org/04efg9a07","country_code":"MA","type":"education","lineage":["https://openalex.org/I81605866"]}],"countries":["MA"],"is_corresponding":true,"raw_author_name":"Charl\u00e8ne B\u00e9atrice Bridge-Nduwimana","raw_affiliation_strings":["Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco"],"affiliations":[{"raw_affiliation_string":"Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","institution_ids":["https://openalex.org/I81605866"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120801255","display_name":"Salah Eddine El El Harrauss","orcid":"https://orcid.org/0009-0006-5643-0263"},"institutions":[{"id":"https://openalex.org/I81605866","display_name":"Sidi Mohamed Ben Abdellah University","ror":"https://ror.org/04efg9a07","country_code":"MA","type":"education","lineage":["https://openalex.org/I81605866"]}],"countries":["MA"],"is_corresponding":true,"raw_author_name":"Salah Eddine El Harrauss","raw_affiliation_strings":["Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco"],"affiliations":[{"raw_affiliation_string":"Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","institution_ids":["https://openalex.org/I81605866"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021802342","display_name":"Aziza El Ouaazizi","orcid":"https://orcid.org/0000-0002-7554-9300"},"institutions":[{"id":"https://openalex.org/I81605866","display_name":"Sidi Mohamed Ben Abdellah University","ror":"https://ror.org/04efg9a07","country_code":"MA","type":"education","lineage":["https://openalex.org/I81605866"]}],"countries":["MA"],"is_corresponding":false,"raw_author_name":"Aziza El Ouaazizi","raw_affiliation_strings":["Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","Laboratory of Engineering Sciences (LSE), Polydisciplinary Faculty of Taza, Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco"],"affiliations":[{"raw_affiliation_string":"Innovative Technologies and Computer Science Laboratory (LT2I), High School of Technology (EST), Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","institution_ids":["https://openalex.org/I81605866"]},{"raw_affiliation_string":"Laboratory of Engineering Sciences (LSE), Polydisciplinary Faculty of Taza, Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","institution_ids":["https://openalex.org/I81605866"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065223940","display_name":"Majid Ben Yakhlef","orcid":"https://orcid.org/0000-0002-6696-9426"},"institutions":[{"id":"https://openalex.org/I81605866","display_name":"Sidi Mohamed Ben Abdellah University","ror":"https://ror.org/04efg9a07","country_code":"MA","type":"education","lineage":["https://openalex.org/I81605866"]}],"countries":["MA"],"is_corresponding":false,"raw_author_name":"Majid Benyakhlef","raw_affiliation_strings":["Laboratory of Engineering Sciences (LSE), Polydisciplinary Faculty of Taza, Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco"],"affiliations":[{"raw_affiliation_string":"Laboratory of Engineering Sciences (LSE), Polydisciplinary Faculty of Taza, Sidi Mohamed Ben Abdellah University, Fez 30000, Morocco","institution_ids":["https://openalex.org/I81605866"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5071421433","https://openalex.org/A5120801255"],"corresponding_institution_ids":["https://openalex.org/I81605866"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":2.7163,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.93034656,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"9","issue":"12","first_page":"321","last_page":"321"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3248000144958496,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3248000144958496,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.164000004529953,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.09019999951124191,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.7139000296592712},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.6933000087738037},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5146999955177307},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.48399999737739563},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.44920000433921814},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.42489999532699585},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.40310001373291016},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39010000228881836}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7437000274658203},{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.7139000296592712},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.6933000087738037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.552299976348877},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5146999955177307},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.48399999737739563},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4733000099658966},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4526999890804291},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.44920000433921814},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.42489999532699585},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.40310001373291016},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39010000228881836},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3723999857902527},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3686000108718872},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.3183000087738037},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.29190000891685486},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.26660001277923584},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.2538999915122986}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/bdcc9120321","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120321","pdf_url":"https://www.mdpi.com/2504-2289/9/12/321/pdf?version=1765621033","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2f4cf59539354b5f9f17a11b497a6906","is_oa":true,"landing_page_url":"https://doaj.org/article/2f4cf59539354b5f9f17a11b497a6906","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Big Data and Cognitive Computing, Vol 9, Iss 12, p 321 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/bdcc9120321","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120321","pdf_url":"https://www.mdpi.com/2504-2289/9/12/321/pdf?version=1765621033","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4417317650.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Upstream":[0],"processes":[1],"strongly":[2],"influence":[3],"downstream":[4],"analysis":[5],"in":[6,11,73,98,212],"sequential":[7],"data-processing":[8],"workflows,":[9],"particularly":[10],"machine":[12],"learning,":[13],"where":[14],"data":[15,68,103,111,116],"quality":[16],"directly":[17],"affects":[18],"model":[19,43],"performance.":[20],"Conventional":[21],"statistical":[22],"imputations":[23,72],"often":[24],"fail":[25],"to":[26,62,144,152],"capture":[27],"nonlinear":[28],"dependencies,":[29],"while":[30],"deep":[31,47],"learning":[32,48],"approaches":[33],"typically":[34],"lack":[35],"uncertainty":[36,171],"quantification.":[37],"We":[38,93],"introduce":[39],"a":[40,46,57,190,200],"hybrid":[41],"imputation":[42,128,132,154,197],"that":[44,85],"integrates":[45],"autoencoder":[49],"with":[50],"Convolutional":[51],"Neural":[52],"Network":[53],"(CNN)":[54],"layers":[55],"and":[56,78,113,148,163,167],"Transformer-based":[58],"contextual":[59],"modeling":[60],"architecture":[61],"address":[63],"systematic":[64],"variation":[65],"across":[66],"heterogeneous":[67],"sources.":[69],"Performing":[70],"multiple":[71,180,194],"the":[74,127,135,183,186],"autoencoder\u2013transformer":[75],"latent":[76],"space":[77],"averaging":[79],"representations":[80],"provides":[81],"implicit":[82],"batch":[83,91,214],"correction":[84],"suppresses":[86],"context-specific":[87],"remains":[88],"without":[89],"explicit":[90],"identifiers.":[92],"performed":[94],"experiments":[95],"on":[96,177,189],"datasets":[97,178],"which":[99],"10%":[100],"of":[101,185],"missing":[102,110,115],"was":[104,157],"artificially":[105],"introduced":[106],"by":[107,141,149],"completely":[108],"random":[109],"(MCAR)":[112],"non-random":[114],"(MNAR)":[117],"mechanisms.":[118],"They":[119],"demonstrated":[120],"practical":[121,201],"performance,":[122],"jointly":[123],"ranking":[124],"first":[125],"among":[126],"methods":[129],"evaluated.":[130],"This":[131],"technique":[133,198],"reduced":[134],"root":[136],"mean":[137],"square":[138],"error":[139],"(RMSE)":[140],"50%":[142],"compared":[143,151],"denoising":[145],"autoencoders":[146],"(DAE)":[147],"46%":[150],"iterative":[153],"(MICE).":[155],"Performance":[156],"comparable":[158],"for":[159],"adversarial":[160],"models":[161,165],"(GAIN)":[162],"attention-based":[164],"(MIDA),":[166],"both":[168],"provided":[169],"interpretable":[170],"estimates":[172],"(CV":[173],"=":[174],"0.08\u20130.15).":[175],"Validation":[176],"from":[179,193],"sources":[181],"confirmed":[182],"robustness":[184],"technique:":[187],"notably,":[188],"forensic":[191],"dataset":[192],"laboratories,":[195],"our":[196],"achieved":[199],"improvement":[202],"over":[203],"GAIN":[204],"(0.146":[205],"vs.":[206],"0.189":[207],"RMSE),":[208],"highlighting":[209],"its":[210],"effectiveness":[211],"mitigating":[213],"effects.":[215]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-12-15T00:00:00"}
