{"id":"https://openalex.org/W2154586245","doi":"https://doi.org/10.1145/1526709.1526786","title":"A hybrid phish detection approach by identity discovery and keywords retrieval","display_name":"A hybrid phish detection approach by identity discovery and keywords retrieval","publication_year":2009,"publication_date":"2009-04-20","ids":{"openalex":"https://openalex.org/W2154586245","doi":"https://doi.org/10.1145/1526709.1526786","mag":"2154586245"},"language":"en","primary_location":{"id":"doi:10.1145/1526709.1526786","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1526709.1526786","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th international conference on World wide web","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029285921","display_name":"Guang Xiang","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Guang Xiang","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090310268","display_name":"Jason Hong","orcid":"https://orcid.org/0000-0002-9856-9654"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason I. Hong","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5029285921"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":21.7385,"has_fulltext":false,"cited_by_count":115,"citation_normalized_percentile":{"value":0.99239819,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"571","last_page":"580"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/phishing","display_name":"Phishing","score":0.7970236539840698},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7661093473434448},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.6250092387199402},{"id":"https://openalex.org/keywords/false-positive-rate","display_name":"False positive rate","score":0.5016272068023682},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.49993181228637695},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.45922982692718506},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.44159799814224243},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3413316011428833},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23669040203094482},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.199225515127182}],"concepts":[{"id":"https://openalex.org/C83860907","wikidata":"https://www.wikidata.org/wiki/Q135005","display_name":"Phishing","level":3,"score":0.7970236539840698},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7661093473434448},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.6250092387199402},{"id":"https://openalex.org/C95922358","wikidata":"https://www.wikidata.org/wiki/Q5432725","display_name":"False positive rate","level":2,"score":0.5016272068023682},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.49993181228637695},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.45922982692718506},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.44159799814224243},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3413316011428833},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23669040203094482},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.199225515127182},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1526709.1526786","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1526709.1526786","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th international conference on World wide web","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.170.3138","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.170.3138","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.cmu.edu/%7Ejasonh/publications/www2009-phish-detection-ner-ir-final.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W192036632","https://openalex.org/W215137156","https://openalex.org/W1593211785","https://openalex.org/W2010608681","https://openalex.org/W2053774863","https://openalex.org/W2139565456","https://openalex.org/W2144578941","https://openalex.org/W2147495097"],"related_works":["https://openalex.org/W2149202530","https://openalex.org/W2807822918","https://openalex.org/W2921723332","https://openalex.org/W2482950156","https://openalex.org/W4396966040","https://openalex.org/W2305322260","https://openalex.org/W3139248031","https://openalex.org/W3042334625","https://openalex.org/W4200017362","https://openalex.org/W4388020458"],"abstract_inverted_index":{"Phishing":[0],"is":[1,92],"a":[2,21,106,120,130,137],"significant":[3],"security":[4],"threat":[5],"to":[6,72,94,97],"the":[7,49,55,67,126],"Internet,":[8],"which":[9],"causes":[10],"tremendous":[11],"economic":[12],"loss":[13],"every":[14],"year.":[15],"In":[16],"this":[17],"paper,":[18],"we":[19],"proposed":[20],"novel":[22],"hybrid":[23],"phish":[24],"detection":[25],"method":[26,42,76],"based":[27],"on":[28],"information":[29,33],"extraction":[30],"(IE)":[31],"and":[32,54,87,90,125],"retrieval":[34],"(IR)":[35],"techniques.":[36],"The":[37,60],"identity-based":[38],"component":[39,62],"of":[40,69,84,109,134,141],"our":[41],"detects":[43],"phishing":[44,85,101],"webpages":[45],"by":[46],"directly":[47],"discovering":[48],"inconsistency":[50],"between":[51],"their":[52],"identity":[53,56],"they":[57],"are":[58],"imitating.":[59],"keywords-retrieval":[61],"utilizes":[63],"IR":[64],"algorithms":[65],"exploiting":[66],"power":[68],"search":[70],"engines":[71],"identify":[73],"phish.":[74],"Our":[75],"requires":[77],"no":[78,81],"training":[79],"data,":[80],"prior":[82],"knowledge":[83],"signatures":[86],"specific":[88],"implementations,":[89],"thus":[91],"able":[93],"adapt":[95],"quickly":[96],"constantly":[98],"appearing":[99],"new":[100],"patterns.":[102],"Comprehensive":[103],"experiments":[104],"over":[105],"diverse":[107],"spectrum":[108],"data":[110],"sources":[111],"with":[112,136],"11449":[113],"pages":[114],"show":[115],"that":[116],"both":[117],"components":[118],"have":[119],"low":[121],"false":[122,138],"positive":[123,132,139],"rate":[124,133,140],"stacked":[127],"approach":[128],"achieves":[129],"true":[131],"90.06%":[135],"1.95%.":[142]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":10},{"year":2015,"cited_by_count":13},{"year":2014,"cited_by_count":11},{"year":2013,"cited_by_count":10},{"year":2012,"cited_by_count":7}],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2025-10-10T00:00:00"}
