{"id":"https://openalex.org/W4283446311","doi":"https://doi.org/10.1145/3533050.3533063","title":"N-Gram-Based Machine Learning Approach for Bot or Human Detection from Text Messages","display_name":"N-Gram-Based Machine Learning Approach for Bot or Human Detection from Text Messages","publication_year":2022,"publication_date":"2022-04-09","ids":{"openalex":"https://openalex.org/W4283446311","doi":"https://doi.org/10.1145/3533050.3533063"},"language":"en","primary_location":{"id":"doi:10.1145/3533050.3533063","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3533050.3533063","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Intelligent Systems, Metaheuristics &amp; Swarm Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030845592","display_name":"Durga Prasad Kavadi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Durga Prasad Kavadi","raw_affiliation_strings":["Department of Artificial Intelligence and Machine Learning, B V Raju Institute of Technology, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence and Machine Learning, B V Raju Institute of Technology, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057792870","display_name":"Chandra Sekhar Sanaboina","orcid":"https://orcid.org/0000-0002-3180-2036"},"institutions":[{"id":"https://openalex.org/I142809039","display_name":"Jawaharlal Nehru Technological University, Kakinada","ror":"https://ror.org/05s9t8c95","country_code":"IN","type":"education","lineage":["https://openalex.org/I142809039"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Chandra Sekhar Sanaboina","raw_affiliation_strings":["Department of Computer Science and Engineering, Jawaharlal Nehru Technological University Kakinada, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Jawaharlal Nehru Technological University Kakinada, India","institution_ids":["https://openalex.org/I142809039"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050142015","display_name":"Rizwan Patan","orcid":"https://orcid.org/0000-0003-4878-1988"},"institutions":[{"id":"https://openalex.org/I172980758","display_name":"Kennesaw State University","ror":"https://ror.org/00jeqjx33","country_code":"US","type":"education","lineage":["https://openalex.org/I172980758"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rizwan Patan","raw_affiliation_strings":["Department of Software Engineering &amp; Game Development, Kennesaw State University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Software Engineering &amp; Game Development, Kennesaw State University, USA","institution_ids":["https://openalex.org/I172980758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039341855","display_name":"Amir H. Gandomi","orcid":"https://orcid.org/0000-0002-2798-0104"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Amir Gandomi","raw_affiliation_strings":["Faculty of Engineering &amp; Information Technology, University of Technology Sydney, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering &amp; Information Technology, University of Technology Sydney, Australia","institution_ids":["https://openalex.org/I114017466"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10702877,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"80","last_page":"85"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7961841225624084},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6318532228469849},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5751276016235352},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.5513659119606018},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5341692566871643},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.5335866212844849},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.491610586643219},{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.4901359975337982},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.48290061950683594},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4734346866607666},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.44717171788215637},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37632179260253906},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.34724438190460205},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.2572707533836365}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7961841225624084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6318532228469849},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5751276016235352},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.5513659119606018},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5341692566871643},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.5335866212844849},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.491610586643219},{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.4901359975337982},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48290061950683594},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4734346866607666},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44717171788215637},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37632179260253906},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34724438190460205},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2572707533836365},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3533050.3533063","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3533050.3533063","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Intelligent Systems, Metaheuristics &amp; Swarm Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1560724230","https://openalex.org/W1586444875","https://openalex.org/W1837843568","https://openalex.org/W2013208103","https://openalex.org/W2072715695","https://openalex.org/W2092277251","https://openalex.org/W2140321362","https://openalex.org/W2165612380","https://openalex.org/W2263846226","https://openalex.org/W2510717748","https://openalex.org/W2549201775","https://openalex.org/W2911964244","https://openalex.org/W2964659200","https://openalex.org/W2965968305","https://openalex.org/W2965987121","https://openalex.org/W2966262219","https://openalex.org/W2966317983","https://openalex.org/W3097132272","https://openalex.org/W3125182500","https://openalex.org/W4206005644","https://openalex.org/W4239510810"],"related_works":["https://openalex.org/W2097492617","https://openalex.org/W2753240997","https://openalex.org/W1764168690","https://openalex.org/W4388745254","https://openalex.org/W2889302474","https://openalex.org/W2980082554","https://openalex.org/W1517228774","https://openalex.org/W2767419625","https://openalex.org/W2389704471","https://openalex.org/W2068663901"],"abstract_inverted_index":{"Social":[0],"bots":[1,19],"are":[2,86,93,151,177],"computer":[3],"programs":[4],"created":[5],"for":[6,71,212],"automating":[7],"general":[8],"human":[9,75],"activities":[10,28],"like":[11,33],"the":[12,42,55,59,130,154,158,164,181,192,207],"generation":[13],"of":[14,18,38,41,61,80,107,119,129,145,160,210],"messages.":[15],"The":[16,77,88,116,134,186,202],"rise":[17],"in":[20,49,96,153,163,195],"social":[21,50],"network":[22],"platforms":[23,52],"has":[24],"led":[25],"to":[26,53,58,101,156,179,191],"malicious":[27],"such":[29],"as":[30,138],"content":[31],"pollution":[32],"spammers":[34],"or":[35,74],"malware":[36],"dissemination":[37],"misinformation.":[39],"Most":[40],"researchers":[43],"focused":[44],"on":[45],"detecting":[46],"bot":[47,73,199],"accounts":[48],"media":[51],"avoid":[54],"damages":[56],"done":[57],"opinions":[60],"users.":[62],"In":[63],"this":[64],"work,":[65],"n-gram":[66],"based":[67],"approach":[68,188],"is":[69,109,121,136],"proposed":[70,187],"a":[72,125,142],"detection.":[76,214],"content-based":[78],"features":[79,120,162],"character":[81,89],"n-grams":[82,85,92,108,161],"and":[83,90,174],"word":[84,91],"used.":[87],"successfully":[94],"proved":[95],"various":[97],"authorship":[98],"analysis":[99],"tasks":[100],"improve":[102],"accuracy.":[103],"A":[104],"huge":[105],"number":[106],"identified":[110],"after":[111],"applying":[112],"different":[113],"pre-processing":[114],"techniques.":[115],"high":[117],"dimensionality":[118],"reduced":[122,143],"by":[123,140],"using":[124,141,183],"feature":[126],"selection":[127],"technique":[128],"Relevant":[131],"Discrimination":[132],"Criterion.":[133],"text":[135],"represented":[137],"vectors":[139],"set":[144],"features.":[146],"Different":[147],"term":[148],"weight":[149,159],"measures":[150],"used":[152,178],"experiment":[155],"compute":[157],"document":[165,184],"vector":[166],"representation.":[167],"Two":[168],"classification":[169],"algorithms,":[170],"Support":[171],"Vector":[172],"Machine,":[173],"Random":[175,203],"Forest":[176,204],"train":[180],"model":[182],"vectors.":[185],"was":[189],"applied":[190],"dataset":[193],"provided":[194],"PAN":[196],"2019":[197],"competition":[198],"detection":[200],"task.":[201],"classifier":[205],"obtained":[206],"best":[208],"accuracy":[209],"0.9456":[211],"bot/human":[213]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
