{"id":"https://openalex.org/W3199849862","doi":"https://doi.org/10.1109/tai.2021.3114390","title":"Toward Text Data Augmentation for Sentiment Analysis","display_name":"Toward Text Data Augmentation for Sentiment Analysis","publication_year":2021,"publication_date":"2021-09-21","ids":{"openalex":"https://openalex.org/W3199849862","doi":"https://doi.org/10.1109/tai.2021.3114390","mag":"3199849862"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2021.3114390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2021.3114390","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/11368/3055528","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043191034","display_name":"Hugo Abonizio","orcid":"https://orcid.org/0000-0001-5208-0290"},"institutions":[{"id":"https://openalex.org/I127110123","display_name":"Universidade Estadual de Londrina","ror":"https://ror.org/01585b035","country_code":"BR","type":"education","lineage":["https://openalex.org/I127110123"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Hugo Queiroz Abonizio","raw_affiliation_strings":["Computer Science Department, State University of Londrina (UEL), Londrina, Brazil"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, State University of Londrina (UEL), Londrina, Brazil","institution_ids":["https://openalex.org/I127110123"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089479540","display_name":"Emerson Cabrera Para\u00edso","orcid":"https://orcid.org/0000-0002-6740-7855"},"institutions":[{"id":"https://openalex.org/I176838256","display_name":"Pontif\u00edcia Universidade Cat\u00f3lica do Paran\u00e1","ror":"https://ror.org/02x1vjk79","country_code":"BR","type":"education","lineage":["https://openalex.org/I176838256"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Emerson Cabrera Paraiso","raw_affiliation_strings":["Informatics Department, Pontificia Universidade Catolica do Parana (PUCPR), Curitiba, Brazil"],"affiliations":[{"raw_affiliation_string":"Informatics Department, Pontificia Universidade Catolica do Parana (PUCPR), Curitiba, Brazil","institution_ids":["https://openalex.org/I176838256"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004953377","display_name":"Sylvio Barbon","orcid":"https://orcid.org/0000-0002-4988-0702"},"institutions":[{"id":"https://openalex.org/I127110123","display_name":"Universidade Estadual de Londrina","ror":"https://ror.org/01585b035","country_code":"BR","type":"education","lineage":["https://openalex.org/I127110123"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Sylvio Barbon","raw_affiliation_strings":["Computer Science Department, State University of Londrina (UEL), Londrina, Brazil"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, State University of Londrina (UEL), Londrina, Brazil","institution_ids":["https://openalex.org/I127110123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5043191034"],"corresponding_institution_ids":["https://openalex.org/I127110123"],"apc_list":null,"apc_paid":null,"fwci":5.5899,"has_fulltext":false,"cited_by_count":62,"citation_normalized_percentile":{"value":0.96550655,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"3","issue":"5","first_page":"657","last_page":"668"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8292636275291443},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.7725620269775391},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.661974310874939},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5631572008132935},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5380707383155823},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5200669169425964},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.47900599241256714},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.46600183844566345},{"id":"https://openalex.org/keywords/external-data-representation","display_name":"External Data Representation","score":0.42421048879623413},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4225081205368042},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41787663102149963},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3765689432621002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8292636275291443},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.7725620269775391},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.661974310874939},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5631572008132935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5380707383155823},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5200669169425964},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.47900599241256714},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.46600183844566345},{"id":"https://openalex.org/C116409475","wikidata":"https://www.wikidata.org/wiki/Q1385056","display_name":"External Data Representation","level":2,"score":0.42421048879623413},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4225081205368042},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41787663102149963},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3765689432621002},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tai.2021.3114390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2021.3114390","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:arts.units.it:11368/3055528","is_oa":true,"landing_page_url":"https://hdl.handle.net/11368/3055528","pdf_url":null,"source":{"id":"https://openalex.org/S4306400480","display_name":"ArTS Archivio della ricerca di Trieste (University of Trieste https://www.units.it/)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I142444530","host_organization_name":"University of Trieste","host_organization_lineage":["https://openalex.org/I142444530"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:arts.units.it:11368/3055528","is_oa":true,"landing_page_url":"https://hdl.handle.net/11368/3055528","pdf_url":null,"source":{"id":"https://openalex.org/S4306400480","display_name":"ArTS Archivio della ricerca di Trieste (University of Trieste https://www.units.it/)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I142444530","host_organization_name":"University of Trieste","host_organization_lineage":["https://openalex.org/I142444530"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7099999785423279}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":86,"referenced_works":["https://openalex.org/W153185079","https://openalex.org/W1505629914","https://openalex.org/W1506806321","https://openalex.org/W1546425147","https://openalex.org/W1832693441","https://openalex.org/W2061873838","https://openalex.org/W2064675550","https://openalex.org/W2066606993","https://openalex.org/W2067624665","https://openalex.org/W2081580037","https://openalex.org/W2095705004","https://openalex.org/W2101234009","https://openalex.org/W2119821739","https://openalex.org/W2132019450","https://openalex.org/W2132555391","https://openalex.org/W2146334809","https://openalex.org/W2165698076","https://openalex.org/W2250539671","https://openalex.org/W2251658415","https://openalex.org/W2306941105","https://openalex.org/W2401379394","https://openalex.org/W2508865106","https://openalex.org/W2805774077","https://openalex.org/W2810374907","https://openalex.org/W2889149926","https://openalex.org/W2889326796","https://openalex.org/W2892068161","https://openalex.org/W2892131163","https://openalex.org/W2896556344","https://openalex.org/W2905266130","https://openalex.org/W2908694192","https://openalex.org/W2912877146","https://openalex.org/W2920582597","https://openalex.org/W2923014074","https://openalex.org/W2949736877","https://openalex.org/W2953356739","https://openalex.org/W2954996726","https://openalex.org/W2962772844","https://openalex.org/W2963212250","https://openalex.org/W2963216553","https://openalex.org/W2963329574","https://openalex.org/W2963545917","https://openalex.org/W2963993537","https://openalex.org/W2964120993","https://openalex.org/W2964236337","https://openalex.org/W2970418174","https://openalex.org/W2971296908","https://openalex.org/W2979826702","https://openalex.org/W2985353426","https://openalex.org/W2986191653","https://openalex.org/W2997200074","https://openalex.org/W2998184481","https://openalex.org/W3034898894","https://openalex.org/W3034999214","https://openalex.org/W3035542229","https://openalex.org/W3094173182","https://openalex.org/W3096660185","https://openalex.org/W3105966348","https://openalex.org/W3106234277","https://openalex.org/W3115047749","https://openalex.org/W3135939397","https://openalex.org/W3155393281","https://openalex.org/W4289145467","https://openalex.org/W6631190155","https://openalex.org/W6638523607","https://openalex.org/W6638545294","https://openalex.org/W6674330103","https://openalex.org/W6675354045","https://openalex.org/W6680110197","https://openalex.org/W6682691769","https://openalex.org/W6685053522","https://openalex.org/W6691459498","https://openalex.org/W6727099177","https://openalex.org/W6743928203","https://openalex.org/W6757415572","https://openalex.org/W6757817989","https://openalex.org/W6763165154","https://openalex.org/W6763701032","https://openalex.org/W6765939562","https://openalex.org/W6768851824","https://openalex.org/W6774569510","https://openalex.org/W6776476930","https://openalex.org/W6779570082","https://openalex.org/W6784056776","https://openalex.org/W6784141058","https://openalex.org/W6940318546"],"related_works":["https://openalex.org/W2548633793","https://openalex.org/W3089396779","https://openalex.org/W3132372214","https://openalex.org/W2596247554","https://openalex.org/W4301373556","https://openalex.org/W2941935829","https://openalex.org/W2438765327","https://openalex.org/W3013279174","https://openalex.org/W4317653575","https://openalex.org/W4224284088"],"abstract_inverted_index":{"A":[0],"significant":[1],"part":[2],"of":[3,23,41,60,69,85,113,146,156,170,176,220],"natural":[4],"language":[5,125],"processing":[6],"(NLP)":[7],"techniques":[8],"for":[9,32,188],"sentiment":[10,26,235],"analysis":[11,27,236],"is":[12],"based":[13],"on":[14],"supervised":[15],"methods,":[16,46],"which":[17],"are":[18],"affected":[19],"by":[20,194],"the":[21,58,65,81,154,184,196,199,218],"quality":[22,34,68],"data.":[24,43],"Therefore,":[25],"needs":[28],"to":[29,56,72,143,152,203,208,214],"be":[30],"prepared":[31],"data":[33,62,92,98,151],"issues,":[35],"such":[36,89],"as":[37,90],"imbalance":[38],"and":[39,63,67,83,96,123,135,149,164,173,224,237],"lack":[40],"labeled":[42],"Data":[44],"augmentation":[45,87,222],"widely":[47],"adopted":[48],"in":[49,160,234],"image":[50],"classification":[51,102],"tasks,":[52],"include":[53,217],"data-space":[54],"solutions":[55],"tackle":[57],"problem":[59],"limited":[61,150],"enhance":[64],"size":[66],"training":[70],"datasets":[71,142,148,200],"provide":[73,144,165],"better":[74],"models.":[75],"In":[76],"this":[77,215],"work,":[78],"we":[79],"study":[80],"advantages":[82],"drawbacks":[84],"text":[86],"methods":[88,175,223],"easy":[91],"augmentation,":[93],"back-translation,":[94],"BART,":[95],"pretrained":[97],"augmentor)":[99],"with":[100,127],"recent":[101,231],"algorithms":[103],"(long":[104],"short-term":[105],"memory,":[106],"convolutional":[107],"neural":[108],"network,":[109],"bidirectional":[110],"encoder":[111],"representations":[112],"transformers,":[114],"support":[115],"vector":[116],"machine,":[117],"gated":[118],"recurrent":[119],"units,":[120],"random":[121],"forests,":[122],"enhanced":[124],"representation":[126],"informative":[128],"entities,":[129],"that":[130],"have":[131,204],"attracted":[132],"sentiment-analysis":[133,141],"researchers":[134],"industry":[136],"applications.":[137],"We":[138],"explored":[139],"seven":[140],"scenarios":[145],"imbalanced":[147],"discuss":[153],"influence":[155],"a":[157],"given":[158],"classifier":[159],"overcoming":[161],"these":[162],"problems,":[163],"insights":[166],"into":[167],"promising":[168],"combinations":[169],"transformation,":[171],"paraphrasing,":[172],"generation":[174],"sentence":[177],"augmentation.":[178],"The":[179,212],"results":[180],"revealed":[181],"improvements":[182],"from":[183,230],"augmented":[185],"dataset,":[186],"mainly":[187],"reduced":[189],"datasets.":[190],"Furthermore,":[191],"when":[192],"balanced":[193],"augmenting":[195],"minority":[197],"class,":[198],"were":[201],"found":[202],"improved":[205],"quality,":[206],"leading":[207],"more":[209],"robust":[210],"classifiers.":[211],"contributions":[213],"article":[216],"taxonomy":[219],"NLP":[221],"their":[225],"efficiency":[226],"over":[227],"several":[228],"classifiers":[229],"research":[232],"trends":[233],"related":[238],"fields.":[239]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":22},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2021-09-27T00:00:00"}
