{"id":"https://openalex.org/W4414196849","doi":"https://doi.org/10.1109/access.2025.3610157","title":"Data Augmentation for Text Classification Using Autoencoders","display_name":"Data Augmentation for Text Classification Using Autoencoders","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4414196849","doi":"https://doi.org/10.1109/access.2025.3610157"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3610157","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3610157","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3610157","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020233555","display_name":"Mustafa \u00c7atalta\u015f","orcid":"https://orcid.org/0000-0002-5598-9659"},"institutions":[{"id":"https://openalex.org/I4210117254","display_name":"Konya Technical University","ror":"https://ror.org/02s82rs08","country_code":"TR","type":"education","lineage":["https://openalex.org/I4210117254"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Mustafa Cataltas","raw_affiliation_strings":["Department of Computer Engineering, Konya Technical University, Konya, T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Konya Technical University, Konya, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I4210117254"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081470277","display_name":"Ilyas Cicekli","orcid":"https://orcid.org/0000-0001-5448-9655"},"institutions":[{"id":"https://openalex.org/I66514158","display_name":"Hacettepe University","ror":"https://ror.org/04kwvgz42","country_code":"TR","type":"education","lineage":["https://openalex.org/I66514158"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Ilyas Cicekli","raw_affiliation_strings":["Department of Computer Engineering, Hacettepe University, Ankara, T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Hacettepe University, Ankara, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I66514158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011188700","display_name":"Nurdan Akhan Baykan","orcid":"https://orcid.org/0000-0002-4289-8889"},"institutions":[{"id":"https://openalex.org/I4210117254","display_name":"Konya Technical University","ror":"https://ror.org/02s82rs08","country_code":"TR","type":"education","lineage":["https://openalex.org/I4210117254"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Nurdan Akhan Baykan","raw_affiliation_strings":["Department of Computer Engineering, Konya Technical University, Konya, T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Konya Technical University, Konya, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I4210117254"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5020233555"],"corresponding_institution_ids":["https://openalex.org/I4210117254"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.8331,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.92403421,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"13","issue":null,"first_page":"161594","last_page":"161604"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.5641999840736389,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.5641999840736389,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.9265000224113464},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.652999997138977},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5038999915122986},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49309998750686646},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47909998893737793},{"id":"https://openalex.org/keywords/test-data","display_name":"Test data","score":0.43799999356269836},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4327999949455261},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.430400013923645},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.39010000228881836}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.9265000224113464},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7839999794960022},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7635999917984009},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.652999997138977},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5038999915122986},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49309998750686646},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47909998893737793},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44200000166893005},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.43799999356269836},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4327999949455261},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.430400013923645},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.39010000228881836},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3605000078678131},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C2780724565","wikidata":"https://www.wikidata.org/wiki/Q5227256","display_name":"Data classification","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3095000088214874},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.30889999866485596},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.30869999527931213},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3050000071525574},{"id":"https://openalex.org/C2781170535","wikidata":"https://www.wikidata.org/wiki/Q30587856","display_name":"Noisy data","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.2833999991416931},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.266400009393692},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C148524875","wikidata":"https://www.wikidata.org/wiki/Q6975395","display_name":"F1 score","level":2,"score":0.2572000026702881}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3610157","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3610157","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b44814f8abf74cbbb37932d036b43730","is_oa":true,"landing_page_url":"https://doaj.org/article/b44814f8abf74cbbb37932d036b43730","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 161594-161604 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3610157","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3610157","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2025768430","https://openalex.org/W2064675550","https://openalex.org/W2122538988","https://openalex.org/W2251658415","https://openalex.org/W2251939518","https://openalex.org/W2892131163","https://openalex.org/W2937423263","https://openalex.org/W2971296908","https://openalex.org/W2987479080","https://openalex.org/W2997308257","https://openalex.org/W2998184481","https://openalex.org/W3080764280","https://openalex.org/W3099617520","https://openalex.org/W3152268000","https://openalex.org/W3159754263","https://openalex.org/W3195665292","https://openalex.org/W3196750896","https://openalex.org/W3214297092","https://openalex.org/W4226323522","https://openalex.org/W4242592538","https://openalex.org/W4309773749","https://openalex.org/W4327656064","https://openalex.org/W4365504037","https://openalex.org/W4366698663","https://openalex.org/W4378780764","https://openalex.org/W4385245566","https://openalex.org/W4391514872","https://openalex.org/W4400127166","https://openalex.org/W4401042976","https://openalex.org/W4401530293"],"related_works":[],"abstract_inverted_index":{"Deep":[0],"learning":[1],"models":[2],"have":[3],"greatly":[4],"improved":[5],"various":[6],"natural":[7],"language":[8],"processing":[9],"tasks.":[10,231],"However,":[11],"their":[12],"effectiveness":[13,63],"depends":[14],"on":[15,174],"large":[16],"data":[17,29,39,48,69,167,203],"sets,":[18],"which":[19,86,106,151],"can":[20],"be":[21],"difficult":[22],"to":[23,34,71,120],"acquire.":[24],"To":[25,161],"mitigate":[26],"this":[27],"challenge,":[28],"augmentation":[30,49,70,168,185,204],"techniques":[31],"are":[32,87,107,118,139,143,171],"employed":[33],"artificially":[35],"expand":[36],"the":[37,46,62,73,129,135,146,164,215,220],"training":[38,155],"by":[40],"generating":[41],"synthetic":[42],"samples.":[43],"By":[44],"enriching":[45],"dataset,":[47,150],"enhances":[50],"model":[51,57],"generalization,":[52],"reduces":[53],"overfitting,":[54],"and":[55,98,113,157,181,193],"improves":[56],"performance.":[58],"This":[59,218],"paper":[60],"investigates":[61],"of":[64,75,84,110,115,131,137,153,166,177,190,222],"employing":[65],"autoencoders":[66,85,132,223],"for":[67,195],"text":[68,76,103,226],"enhance":[72],"performance":[74],"classification":[77,149,227],"models.":[78,217],"The":[79,141,198],"research":[80],"compares":[81],"four":[82],"types":[83],"Traditional":[88],"Autoencoder":[89,92,96,100],"(AE),":[90],"Adversarial":[91,95],"(AAE),":[93],"Denoising":[94],"(DAAE),":[97],"Variational":[99],"(VAE).":[101],"Basic":[102],"preprocessing":[104],"techniques,":[105],"lowercasing,":[108],"removal":[109,114],"non-alphanumeric":[111],"characters":[112],"stop":[116],"words,":[117],"applied":[119,187],"all":[121],"documents.":[122],"Additionally,":[123],"label-based":[124],"filtering":[125],"is":[126,186],"applied,":[127],"where":[128],"outputs":[130],"that":[133,201],"contradict":[134],"predictions":[136],"BERT":[138],"eliminated.":[140],"experiments":[142,170],"conducted":[144],"using":[145],"SST-2":[147],"sentiment":[148],"consists":[152],"7,791":[154],"instances":[156],"1,821":[158],"test":[159],"instances.":[160,183],"better":[162,212],"analyze":[163],"impact":[165],"methods,":[169,205],"also":[172],"performed":[173],"smaller":[175],"subsets":[176],"100,":[178],"200,":[179],"400,":[180],"1,000":[182],"Data":[184],"at":[188,207],"ratios":[189],"1:1,":[191],"1:2":[192],"1:4":[194],"these":[196],"subsets.":[197],"results":[199],"demonstrate":[200],"AE-based":[202],"particularly":[206],"a":[208],"1:1":[209],"ratio,":[210],"achieve":[211],"accuracy":[213],"than":[214],"baseline":[216],"underscores":[219],"potential":[221],"in":[224,229],"improving":[225],"outcomes":[228],"NLP":[230]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
