{"id":"https://openalex.org/W4297970707","doi":"https://doi.org/10.1561/1500000006","title":"Email Spam Filtering: A Systematic Review","display_name":"Email Spam Filtering: A Systematic Review","publication_year":2008,"publication_date":"2008-06-23","ids":{"openalex":"https://openalex.org/W4297970707","doi":"https://doi.org/10.1561/1500000006"},"language":"en","primary_location":{"id":"doi:10.1561/1500000006","is_oa":false,"landing_page_url":"https://doi.org/10.1561/1500000006","pdf_url":null,"source":{"id":"https://openalex.org/S197106261","display_name":"Foundations and Trends\u00ae in Information Retrieval","issn_l":"1554-0669","issn":["1554-0669","1554-0677"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318575","host_organization_name":"Now Publishers","host_organization_lineage":["https://openalex.org/P4310318575"],"host_organization_lineage_names":["Now Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Foundations and Trends\u00ae in Information Retrieval","raw_type":"journal-article"},"type":"review","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084091807","display_name":"Gordon V. Cormack","orcid":"https://orcid.org/0000-0002-5890-0293"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Gordon V. Cormack","raw_affiliation_strings":["David R. Cheriton School of Computer Science, University of Waterloo,Waterloo , Ontario, N2L 3G1,","David R. Cheriton School of Computer Science, University of Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"David R. Cheriton School of Computer Science, University of Waterloo,Waterloo , Ontario, N2L 3G1,","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"David R. Cheriton School of Computer Science, University of Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5084091807"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":20.9947,"has_fulltext":false,"cited_by_count":248,"citation_normalized_percentile":{"value":0.99222448,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"1","issue":"4","first_page":"335","last_page":"455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.9584000110626221,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11045","display_name":"Privacy, Security, and Data Protection","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5625355839729309},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.48812946677207947},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3504600524902344}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5625355839729309},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.48812946677207947},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3504600524902344}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1561/1500000006","is_oa":false,"landing_page_url":"https://doi.org/10.1561/1500000006","pdf_url":null,"source":{"id":"https://openalex.org/S197106261","display_name":"Foundations and Trends\u00ae in Information Retrieval","issn_l":"1554-0669","issn":["1554-0669","1554-0677"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318575","host_organization_name":"Now Publishers","host_organization_lineage":["https://openalex.org/P4310318575"],"host_organization_lineage_names":["Now Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Foundations and Trends\u00ae in Information Retrieval","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1480484573","https://openalex.org/W1586405805","https://openalex.org/W1965272602","https://openalex.org/W1966026565","https://openalex.org/W2000369940","https://openalex.org/W2015824828","https://openalex.org/W2029551688","https://openalex.org/W2035210366","https://openalex.org/W2042961901","https://openalex.org/W2058737869","https://openalex.org/W2062614982","https://openalex.org/W2092926517","https://openalex.org/W2093555915","https://openalex.org/W2099606292","https://openalex.org/W2108313281","https://openalex.org/W2111310810","https://openalex.org/W2116091861","https://openalex.org/W2118020653","https://openalex.org/W2120189271","https://openalex.org/W2126416132","https://openalex.org/W2126576175","https://openalex.org/W2134208562","https://openalex.org/W2137012911","https://openalex.org/W2140785063","https://openalex.org/W2140821974","https://openalex.org/W2142863739","https://openalex.org/W2161628678","https://openalex.org/W2163294786","https://openalex.org/W2166490929","https://openalex.org/W2169075655","https://openalex.org/W2169384781","https://openalex.org/W2912934387","https://openalex.org/W3102372265","https://openalex.org/W4237411492","https://openalex.org/W4242807147","https://openalex.org/W4244952642"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W2359140296"],"abstract_inverted_index":{"Spam":[0],"is":[1,21,45,54,188,260],"information":[2,136,228,245],"crafted":[3,167],"to":[4,7,25,30,70,80,252,264,324,333,349],"be":[5,112,131,157,162],"delivered":[6],"a":[8,52,87,122,241],"large":[9,242],"number":[10],"of":[11,15,36,63,73,117,125,224,233,240,308,327,336],"recipients,":[12],"in":[13,191,199,277,311],"spite":[14,307],"their":[16,68,160,301,304],"wishes.":[17],"A":[18,82],"spam":[19,27,37,39,44,103,174,189,197,235,292,328,337],"filter":[20,53,236,338],"an":[22],"automated":[23],"tool":[24],"recognize":[26],"so":[28,219],"as":[29,207,237,285,323,332],"prevent":[31],"its":[32],"delivery.":[33],"The":[34,60],"purposes":[35],"and":[38,75,119,138,172,194,202,210,230,243,273,288,303,331,345],"filters":[40,104,293],"are":[41,105,147,152,214,249,282,294],"diametrically":[42],"opposed:":[43],"effective":[46,55,109,128,149],"if":[47,56],"it":[48,57,96],"evades":[49],"filters,":[50],"while":[51],"recognizes":[58],"spam.":[59,265],"circular":[61],"nature":[62],"these":[64,299],"definitions,":[65],"along":[66],"with":[67,177,196],"appeal":[69],"the":[71,115,134,211,222,226,231,234,254,258,325,334],"intent":[72],"sender":[74],"recipient":[76],"make":[77,253],"them":[78],"difficult":[79],"formalize.":[81],"typical":[83],"email":[84],"user":[85],"has":[86],"working":[88],"definition":[89,124,223],"no":[90],"more":[91,108,127,165],"formal":[92,123],"than":[93,110,129],"\"I":[94],"know":[95],"when":[97],"I":[98],"see":[99],"it.\"":[100],"Yet,":[101],"current":[102,171],"remarkably":[106],"effective,":[107],"might":[111,130,155],"expected":[113,132],"given":[114,133],"level":[116],"uncertainty":[118],"debate":[120],"over":[121],"spam,":[126,225],"state-of-the-art":[135],"retrieval":[137],"machine":[139],"learning":[140],"methods":[141,248,289,348],"for":[142,275,290],"seemingly":[143],"similar":[144],"problems.":[145],"But":[146],"they":[148,156,183],"enough?":[150],"Which":[151],"better?":[153],"How":[154],"improved?":[158],"Will":[159],"effectiveness":[161,326],"compromised":[163],"by":[164],"cleverly":[166],"spam?":[168],"We":[169,297,341],"survey":[170,298],"proposed":[173],"filtering":[175,190,198,329],"techniques":[176,330],"particular":[178],"emphasis":[179],"on":[180,261],"how":[181],"well":[182],"work.":[184],"Our":[185],"primary":[186],"focus":[187,259],"email;":[192],"Similarities":[193],"differences":[195,276],"other":[200],"communication":[201],"storage":[203],"media":[204],"\u2014":[205,213],"such":[206],"instant":[208],"messaging":[209],"Web":[212],"addressed":[215],"peripherally.":[216],"In":[217,306],"doing":[218],"we":[220],"examine":[221],"user\u2019s":[227],"requirements":[229],"role":[232],"one":[238],"component":[239],"complex":[244],"universe.":[246],"Well-known":[247],"detailed":[250],"sufficiently":[251],"exposition":[255],"self-contained,":[256],"however,":[257],"considerations":[262],"unique":[263],"Comparisons,":[266],"wherever":[267],"possible,":[268],"use":[269],"common":[270],"evaluation":[271,312,339],"measures,":[272,287],"control":[274],"experimental":[278,347],"setup.":[279],"Such":[280],"comparisons":[281],"not":[283],"easy,":[284],"benchmarks,":[286],"evaluating":[291],"still":[295],"evolving.":[296],"efforts,":[300],"results":[302],"limitations.":[305],"recent":[309],"advances":[310],"methodology,":[313],"many":[314],"uncertainties":[315,344],"(including":[316],"widely":[317],"held":[318],"but":[319],"unsubstantiated":[320],"beliefs)":[321],"remain":[322],"validity":[335],"methods.":[340],"outline":[342],"several":[343],"propose":[346],"address":[350],"them.":[351]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":40},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":22},{"year":2019,"cited_by_count":15},{"year":2018,"cited_by_count":19},{"year":2017,"cited_by_count":14},{"year":2016,"cited_by_count":16},{"year":2015,"cited_by_count":12},{"year":2014,"cited_by_count":13},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":18}],"updated_date":"2026-04-04T06:10:10.580331","created_date":"2025-10-10T00:00:00"}
