{"id":"https://openalex.org/W2792682186","doi":"https://doi.org/10.1007/s10588-018-9266-8","title":"The impact of preprocessing steps on the accuracy of machine learning algorithms in sentiment analysis","display_name":"The impact of preprocessing steps on the accuracy of machine learning algorithms in sentiment analysis","publication_year":2018,"publication_date":"2018-03-16","ids":{"openalex":"https://openalex.org/W2792682186","doi":"https://doi.org/10.1007/s10588-018-9266-8","mag":"2792682186"},"language":"en","primary_location":{"id":"doi:10.1007/s10588-018-9266-8","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10588-018-9266-8","pdf_url":null,"source":{"id":"https://openalex.org/S47778307","display_name":"Computational and Mathematical Organization Theory","issn_l":"1381-298X","issn":["1381-298X","1572-9346"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational and Mathematical Organization Theory","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108686506","display_name":"Saqib Alam","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Saqib Alam","raw_affiliation_strings":["Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People\u2019s Republic of China","Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People's Republic of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People\u2019s Republic of China","institution_ids":["https://openalex.org/I27357992"]},{"raw_affiliation_string":"Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People's Republic of China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067703807","display_name":"Nianmin Yao","orcid":"https://orcid.org/0000-0001-9705-6649"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nianmin Yao","raw_affiliation_strings":["Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People\u2019s Republic of China","Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People's Republic of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People\u2019s Republic of China","institution_ids":["https://openalex.org/I27357992"]},{"raw_affiliation_string":"Department of Electronic Information and Electrical Engineering, Dalian University of Technology, Black Building, Linggong Road No. 2, Ganjingzi District, Dalian, 116024, People's Republic of China","institution_ids":["https://openalex.org/I27357992"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":2090,"currency":"EUR","value_usd":2690},"apc_paid":null,"fwci":3.717,"has_fulltext":false,"cited_by_count":141,"citation_normalized_percentile":{"value":0.94401421,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"25","issue":"3","first_page":"319","last_page":"335"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7773313522338867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7140060663223267},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.7054961919784546},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6798903942108154},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.650402843952179},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.6147809624671936},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.6127688884735107},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5272233486175537},{"id":"https://openalex.org/keywords/statistical-classification","display_name":"Statistical classification","score":0.4986293315887451},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.48113834857940674},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4238974452018738}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7773313522338867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7140060663223267},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.7054961919784546},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6798903942108154},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.650402843952179},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.6147809624671936},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.6127688884735107},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5272233486175537},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.4986293315887451},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.48113834857940674},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4238974452018738}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s10588-018-9266-8","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10588-018-9266-8","pdf_url":null,"source":{"id":"https://openalex.org/S47778307","display_name":"Computational and Mathematical Organization Theory","issn_l":"1381-298X","issn":["1381-298X","1572-9346"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational and Mathematical Organization Theory","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:spr:comaot:v:25:y:2019:i:3:d:10.1007_s10588-018-9266-8","is_oa":false,"landing_page_url":"http://link.springer.com/10.1007/s10588-018-9266-8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W26591655","https://openalex.org/W40549020","https://openalex.org/W1614298861","https://openalex.org/W1982589161","https://openalex.org/W2059126410","https://openalex.org/W2078810130","https://openalex.org/W2250710744","https://openalex.org/W2272031392","https://openalex.org/W2273740070","https://openalex.org/W2399980089","https://openalex.org/W2591334920","https://openalex.org/W2735459586","https://openalex.org/W2735801230","https://openalex.org/W2741793919","https://openalex.org/W2750872979","https://openalex.org/W2763805348","https://openalex.org/W2765753216","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2989490741","https://openalex.org/W138569904","https://openalex.org/W2367545121","https://openalex.org/W4248881655","https://openalex.org/W2482165163","https://openalex.org/W3010890513","https://openalex.org/W3092506759","https://openalex.org/W2390914021","https://openalex.org/W2389417819","https://openalex.org/W3195278891"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":24},{"year":2023,"cited_by_count":37},{"year":2022,"cited_by_count":25},{"year":2021,"cited_by_count":14},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
