{"id":"https://openalex.org/W2095621640","doi":"https://doi.org/10.1017/s1351324914000102","title":"(Un/Semi-)supervised SMS text message SPAM detection","display_name":"(Un/Semi-)supervised SMS text message SPAM detection","publication_year":2014,"publication_date":"2014-10-15","ids":{"openalex":"https://openalex.org/W2095621640","doi":"https://doi.org/10.1017/s1351324914000102","mag":"2095621640"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324914000102","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324914000102","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109906648","display_name":"Chris Giannella","orcid":"https://orcid.org/0000-0002-0118-8506"},"institutions":[{"id":"https://openalex.org/I4210118524","display_name":"Universit\u00e9 Bourgogne Franche-Comt\u00e9","ror":"https://ror.org/02dn7x778","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210118524"]},{"id":"https://openalex.org/I44896327","display_name":"Mitre (United States)","ror":"https://ror.org/03ks2a131","country_code":"US","type":"company","lineage":["https://openalex.org/I44896327"]}],"countries":["FR","US"],"is_corresponding":true,"raw_author_name":"CHRIS R. GIANNELLA","raw_affiliation_strings":["The MITRE Corporation, 7515 Colshire Drive, McLean, VA 22102, USA","The MITRE Corporation 7515 Colshire Drive McLean, VA 22102, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The MITRE Corporation, 7515 Colshire Drive, McLean, VA 22102, USA","institution_ids":["https://openalex.org/I44896327","https://openalex.org/I4210118524"]},{"raw_affiliation_string":"The MITRE Corporation 7515 Colshire Drive McLean, VA 22102, USA","institution_ids":["https://openalex.org/I44896327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037018263","display_name":"Ransom K. Winder","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118524","display_name":"Universit\u00e9 Bourgogne Franche-Comt\u00e9","ror":"https://ror.org/02dn7x778","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210118524"]},{"id":"https://openalex.org/I44896327","display_name":"Mitre (United States)","ror":"https://ror.org/03ks2a131","country_code":"US","type":"company","lineage":["https://openalex.org/I44896327"]}],"countries":["FR","US"],"is_corresponding":false,"raw_author_name":"RANSOM WINDER","raw_affiliation_strings":["The MITRE Corporation, 7515 Colshire Drive, McLean, VA 22102, USA","The MITRE Corporation 7515 Colshire Drive McLean, VA 22102, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The MITRE Corporation, 7515 Colshire Drive, McLean, VA 22102, USA","institution_ids":["https://openalex.org/I44896327","https://openalex.org/I4210118524"]},{"raw_affiliation_string":"The MITRE Corporation 7515 Colshire Drive McLean, VA 22102, USA","institution_ids":["https://openalex.org/I44896327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090580685","display_name":"Brandon Wilson","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"BRANDON WILSON","raw_affiliation_strings":["Department of Computer Science, University of Maryland, College Park, MD 20742, USA","Department of Computer Science, University of Maryland, College Park, MD 20742 USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Maryland, College Park, MD 20742, USA","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Department of Computer Science, University of Maryland, College Park, MD 20742 USA","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109906648"],"corresponding_institution_ids":["https://openalex.org/I4210118524","https://openalex.org/I44896327"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.19140265,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"21","issue":"4","first_page":"553","last_page":"567"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8857501745223999},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6761301755905151},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6540665626525879},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.594555139541626},{"id":"https://openalex.org/keywords/short-message-service","display_name":"Short Message Service","score":0.5928440690040588},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5652347803115845},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.5147109627723694},{"id":"https://openalex.org/keywords/thresholding","display_name":"Thresholding","score":0.4977720081806183},{"id":"https://openalex.org/keywords/gibbs-sampling","display_name":"Gibbs sampling","score":0.4962814450263977},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.4613279402256012},{"id":"https://openalex.org/keywords/bag-of-words-model","display_name":"Bag-of-words model","score":0.4544456899166107},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.42840877175331116},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.38517117500305176}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8857501745223999},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6761301755905151},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6540665626525879},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.594555139541626},{"id":"https://openalex.org/C74558129","wikidata":"https://www.wikidata.org/wiki/Q43024","display_name":"Short Message Service","level":2,"score":0.5928440690040588},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5652347803115845},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.5147109627723694},{"id":"https://openalex.org/C191178318","wikidata":"https://www.wikidata.org/wiki/Q2256906","display_name":"Thresholding","level":3,"score":0.4977720081806183},{"id":"https://openalex.org/C158424031","wikidata":"https://www.wikidata.org/wiki/Q1191905","display_name":"Gibbs sampling","level":3,"score":0.4962814450263977},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.4613279402256012},{"id":"https://openalex.org/C13672336","wikidata":"https://www.wikidata.org/wiki/Q3460803","display_name":"Bag-of-words model","level":2,"score":0.4544456899166107},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.42840877175331116},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.38517117500305176},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s1351324914000102","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324914000102","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W427701137","https://openalex.org/W1527313647","https://openalex.org/W1719067462","https://openalex.org/W1968955064","https://openalex.org/W1973644085","https://openalex.org/W1982302133","https://openalex.org/W1984457329","https://openalex.org/W1991804188","https://openalex.org/W2000369940","https://openalex.org/W2003798735","https://openalex.org/W2015585187","https://openalex.org/W2036166268","https://openalex.org/W2039724772","https://openalex.org/W2040717637","https://openalex.org/W2069128736","https://openalex.org/W2097381646","https://openalex.org/W2102889123","https://openalex.org/W2110357431","https://openalex.org/W2116330964","https://openalex.org/W2132957691","https://openalex.org/W2145376937","https://openalex.org/W2165698076","https://openalex.org/W2170207925","https://openalex.org/W2484412399","https://openalex.org/W2903158431","https://openalex.org/W3009557165","https://openalex.org/W6631531171","https://openalex.org/W6675315280","https://openalex.org/W6677180724","https://openalex.org/W6684836731"],"related_works":["https://openalex.org/W2953058328","https://openalex.org/W1542224353","https://openalex.org/W1661087619","https://openalex.org/W2750730210","https://openalex.org/W2116854923","https://openalex.org/W2125569632","https://openalex.org/W2185524891","https://openalex.org/W2249374134","https://openalex.org/W2611612779","https://openalex.org/W1989373866"],"abstract_inverted_index":{"Abstract":[0],"We":[1,17,89,147],"address":[2],"the":[3,30,43,46,57,91,101,107,119,132,139,149],"problem":[4],"of":[5,29,45,134],"unsupervised":[6,117],"and":[7,35,55,143,153],"semi-supervised":[8,105],"SMS":[9,47,69,77,97,159],"(Short":[10],"Message":[11],"Service)":[12],"text":[13],"message":[14,71],"SPAM":[15,80,160],"detection.":[16,161],"develop":[18],"a":[19,26,51,94,111,122,155],"content-based":[20],"Bayesian":[21],"classification":[22],"approach":[23,40,74,92,108,120,150],"which":[24],"is":[25,154],"modest":[27],"extension":[28],"technique":[31],"discussed":[32],"by":[33,60,84,138],"Resnik":[34],"Hardisty":[36],"in":[37,104,116],"2010.":[38],"The":[39,73],"assumes":[41],"that":[42],"bodies":[44],"messages":[48,78,136],"arise":[49],"from":[50,100],"probabilistic":[52],"generative":[53],"model":[54,58],"estimates":[56],"parameters":[59],"Gibbs":[61],"sampling":[62],"using":[63],"an":[64,126],"unlabeled,":[65],"or":[66,81],"partially":[67],"labeled,":[68],"training":[70,135],"corpus.":[72],"classifies":[75],"new":[76],"as":[79],"HAM":[82],"(non-SPAM)":[83],"zero-thresholding":[85],"their":[86],"logit":[87],"estimates.":[88],"tested":[90],"on":[93],"publicly":[95],"available":[96],"corpora":[98],"collected":[99],"UK.":[102],"Used":[103,115],"fashion,":[106,118],"clearly":[109],"outperformed":[110,121],"competing":[112],"algorithm,":[113],"Semi-Boost.":[114],"fully":[123],"supervised":[124],"classifier,":[125],"SVM":[127,140],"(Support":[128],"Vector":[129],"Machine),":[130],"when":[131],"number":[133],"used":[137],"was":[141],"small":[142],"performed":[144],"comparably":[145],"otherwise.":[146],"believe":[148],"works":[151],"well":[152],"useful":[156],"tool":[157],"for":[158]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
