{"id":"https://openalex.org/W2568349553","doi":"https://doi.org/10.1177/0165551516684296","title":"Feature engineering for detecting spammers on Twitter: Modelling and analysis","display_name":"Feature engineering for detecting spammers on Twitter: Modelling and analysis","publication_year":2017,"publication_date":"2017-01-09","ids":{"openalex":"https://openalex.org/W2568349553","doi":"https://doi.org/10.1177/0165551516684296","mag":"2568349553"},"language":"en","primary_location":{"id":"doi:10.1177/0165551516684296","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551516684296","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028116703","display_name":"Wafa Herzallah","orcid":null},"institutions":[{"id":"https://openalex.org/I114972647","display_name":"University of Jordan","ror":"https://ror.org/05k89ew48","country_code":"JO","type":"education","lineage":["https://openalex.org/I114972647"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Wafa Herzallah","raw_affiliation_strings":["Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan","institution_ids":["https://openalex.org/I114972647"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048560390","display_name":"Hossam Faris","orcid":"https://orcid.org/0000-0003-4261-8127"},"institutions":[{"id":"https://openalex.org/I114972647","display_name":"University of Jordan","ror":"https://ror.org/05k89ew48","country_code":"JO","type":"education","lineage":["https://openalex.org/I114972647"]}],"countries":["JO"],"is_corresponding":true,"raw_author_name":"Hossam Faris","raw_affiliation_strings":["Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan","institution_ids":["https://openalex.org/I114972647"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087648541","display_name":"Omar Adwan","orcid":"https://orcid.org/0000-0003-3967-2456"},"institutions":[{"id":"https://openalex.org/I114972647","display_name":"University of Jordan","ror":"https://ror.org/05k89ew48","country_code":"JO","type":"education","lineage":["https://openalex.org/I114972647"]}],"countries":["JO"],"is_corresponding":false,"raw_author_name":"Omar Adwan","raw_affiliation_strings":["Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Business Information Technology, King Abdullah II School of Information Technology, The University of Jordan, Jordan","institution_ids":["https://openalex.org/I114972647"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5048560390"],"corresponding_institution_ids":["https://openalex.org/I114972647"],"apc_list":null,"apc_paid":null,"fwci":10.1255,"has_fulltext":false,"cited_by_count":55,"citation_normalized_percentile":{"value":0.98043808,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"44","issue":"2","first_page":"230","last_page":"247"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spamming","display_name":"Spamming","score":0.7863231897354126},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7617185711860657},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.669905960559845},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.6603379249572754},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.6031215190887451},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5645826458930969},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5365415215492249},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5208028554916382},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5091597437858582},{"id":"https://openalex.org/keywords/phishing","display_name":"Phishing","score":0.49569642543792725},{"id":"https://openalex.org/keywords/multilayer-perceptron","display_name":"Multilayer perceptron","score":0.4764730930328369},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4726482927799225},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.4355514645576477},{"id":"https://openalex.org/keywords/social-network-analysis","display_name":"Social network analysis","score":0.42487892508506775},{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.4182452857494354},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.4130912125110626},{"id":"https://openalex.org/keywords/feature-engineering","display_name":"Feature engineering","score":0.4123413562774658},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4027150571346283},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.3382086157798767},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.21817851066589355},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.10714873671531677}],"concepts":[{"id":"https://openalex.org/C158955206","wikidata":"https://www.wikidata.org/wiki/Q83058","display_name":"Spamming","level":3,"score":0.7863231897354126},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7617185711860657},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.669905960559845},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.6603379249572754},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.6031215190887451},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5645826458930969},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5365415215492249},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5208028554916382},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5091597437858582},{"id":"https://openalex.org/C83860907","wikidata":"https://www.wikidata.org/wiki/Q135005","display_name":"Phishing","level":3,"score":0.49569642543792725},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.4764730930328369},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4726482927799225},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.4355514645576477},{"id":"https://openalex.org/C114713312","wikidata":"https://www.wikidata.org/wiki/Q7551269","display_name":"Social network analysis","level":3,"score":0.42487892508506775},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.4182452857494354},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.4130912125110626},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.4123413562774658},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4027150571346283},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.3382086157798767},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.21817851066589355},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.10714873671531677},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/0165551516684296","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551516684296","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W196350606","https://openalex.org/W1604938182","https://openalex.org/W2021191744","https://openalex.org/W2073756733","https://openalex.org/W2087576375","https://openalex.org/W2088080849","https://openalex.org/W2110357431","https://openalex.org/W2130486630","https://openalex.org/W2133990480","https://openalex.org/W2136971460","https://openalex.org/W2157894025","https://openalex.org/W2158568356","https://openalex.org/W2286513919","https://openalex.org/W2409135246","https://openalex.org/W2911964244","https://openalex.org/W2912652079","https://openalex.org/W4205199542","https://openalex.org/W4249968242","https://openalex.org/W4253251754","https://openalex.org/W4254211903","https://openalex.org/W6600651459"],"related_works":["https://openalex.org/W1987732684","https://openalex.org/W2286465138","https://openalex.org/W637393809","https://openalex.org/W2808742736","https://openalex.org/W1526983901","https://openalex.org/W3126526144","https://openalex.org/W3021299372","https://openalex.org/W2492910442","https://openalex.org/W2255926860","https://openalex.org/W2901744059"],"abstract_inverted_index":{"Twitter":[0,23],"is":[1,91,118,131],"a":[2,9,24,70,128],"social":[3,250],"networking":[4],"website":[5],"that":[6,55,74,138,188],"has":[7],"gained":[8],"lot":[10],"of":[11,115,145,159,190,214,220,225,233,245],"popularity":[12,21],"around":[13],"the":[14,17,45,51,62,136,143,182,191,200,211,218,221,226,234,237,243,249],"world":[15],"in":[16,61,205,242,248],"last":[18],"decade.":[19],"This":[20],"made":[22],"common":[25],"target":[26],"for":[27,58,155],"spammers":[28,247],"and":[29,37,82,109,120,153,167,236],"malicious":[30],"users":[31],"to":[32,49,68,78,134,180],"spread":[33],"unwanted":[34],"advertisements,":[35],"viruses":[36],"phishing":[38],"attacks.":[39],"In":[40],"this":[41,156,206],"article,":[42],"we":[43],"review":[44],"latest":[46],"research":[47],"works":[48],"determine":[50],"most":[52,189],"effective":[53],"features":[54,65,137,172,216],"were":[56],"investigated":[57],"spam":[59,146],"detection":[60,85,183],"literature.":[63],"These":[64],"are":[66,151,177],"collected":[67],"build":[69,181],"comprehensive":[71,201],"data":[72,89,202],"set":[73,90,203],"can":[75],"be":[76],"used":[77,152,178],"develop":[79],"more":[80],"robust":[81],"accurate":[83],"spammer":[84],"models.":[86,184],"The":[87,112],"new":[88],"tested":[92],"using":[93],"popular":[94],"classifiers":[95,117,193],"(Naive":[96],"Bayes,":[97],"support":[98],"vector":[99],"machines,":[100],"multilayer":[101],"perceptron":[102],"neural":[103],"networks,":[104],"Decision":[105],"Trees,":[106],"Random":[107],"forests":[108],"k-Nearest":[110],"Neighbour).":[111],"prediction":[113],"performance":[114],"these":[116],"evaluated":[119],"compared":[121,154],"based":[122,198],"on":[123,142,199],"different":[124,149],"evaluation":[125,196],"metrics.":[126],"Moreover,":[127],"further":[129],"analysis":[130],"carried":[132],"out":[133],"identify":[135],"have":[139],"higher":[140],"impact":[141],"accuracy":[144],"detection.":[147],"Three":[148],"techniques":[150],"analysis:":[157],"change":[158],"mean":[160],"square":[161],"error":[162],"(CoM),":[163],"information":[164],"gain":[165],"(IG)":[166],"Relief-F":[168],"method.":[169],"Top":[170],"five":[171],"identified":[173],"by":[174],"each":[175],"technique":[176],"again":[179],"Experimental":[185],"results":[186,197],"show":[187],"developed":[192],"obtained":[194],"high":[195],"constructed":[204],"work.":[207],"Experiments":[208],"also":[209],"reveal":[210],"important":[212],"role":[213],"some":[215],"like":[217],"reputation":[219],"account,":[222,235],"average":[223,228,238],"length":[224],"tweet,":[227,231],"mention":[229],"per":[230],"age":[232],"time":[239],"between":[240],"posts":[241],"process":[244],"identifying":[246],"network.":[251]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
