{"id":"https://openalex.org/W2035621475","doi":"https://doi.org/10.1145/1326561.1326565","title":"Detecting splogs via temporal dynamics using self-similarity analysis","display_name":"Detecting splogs via temporal dynamics using self-similarity analysis","publication_year":2008,"publication_date":"2008-02-01","ids":{"openalex":"https://openalex.org/W2035621475","doi":"https://doi.org/10.1145/1326561.1326565","mag":"2035621475"},"language":"en","primary_location":{"id":"doi:10.1145/1326561.1326565","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1326561.1326565","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042159546","display_name":"Yu\u2010Ru Lin","orcid":"https://orcid.org/0000-0002-8497-3015"},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yu-Ru Lin","raw_affiliation_strings":["Arizona State University, AZ","Arizona State University, AZ#TAB#"],"affiliations":[{"raw_affiliation_string":"Arizona State University, AZ","institution_ids":["https://openalex.org/I55732556"]},{"raw_affiliation_string":"Arizona State University, AZ#TAB#","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018532037","display_name":"Hari Sundaram","orcid":"https://orcid.org/0000-0003-3315-6055"},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hari Sundaram","raw_affiliation_strings":["Arizona State University, AZ","Arizona State University, AZ#TAB#"],"affiliations":[{"raw_affiliation_string":"Arizona State University, AZ","institution_ids":["https://openalex.org/I55732556"]},{"raw_affiliation_string":"Arizona State University, AZ#TAB#","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075969864","display_name":"Y\u00fcn Chi","orcid":"https://orcid.org/0000-0002-8441-3974"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yun Chi","raw_affiliation_strings":["NEC Laboratories America, Cupertino, CA"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America, Cupertino, CA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088763786","display_name":"Junichi Tatemura","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junichi Tatemura","raw_affiliation_strings":["NEC Laboratories America, Cupertino, CA"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America, Cupertino, CA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112455964","display_name":"Belle L. Tseng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Belle L. Tseng","raw_affiliation_strings":["NEC Laboratories America, Cupertino, CA"],"affiliations":[{"raw_affiliation_string":"NEC Laboratories America, Cupertino, CA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5042159546"],"corresponding_institution_ids":["https://openalex.org/I55732556"],"apc_list":null,"apc_paid":null,"fwci":8.4311,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.98324827,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"2","issue":"1","first_page":"1","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7695480585098267},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5848814249038696},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5422864556312561},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.5306474566459656},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.48532575368881226},{"id":"https://openalex.org/keywords/histogram","display_name":"Histogram","score":0.4673752188682556},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4574034512042999},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4401562213897705},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.42585447430610657},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.39235955476760864},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1753239631652832}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7695480585098267},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5848814249038696},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5422864556312561},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.5306474566459656},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.48532575368881226},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.4673752188682556},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4574034512042999},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4401562213897705},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.42585447430610657},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.39235955476760864},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1753239631652832},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1326561.1326565","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1326561.1326565","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.139.8193","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.139.8193","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.nec-labs.com/~ychi/publication/tweb08_splog.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.5699999928474426,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W44499633","https://openalex.org/W106005634","https://openalex.org/W160659377","https://openalex.org/W169395954","https://openalex.org/W172410088","https://openalex.org/W202878612","https://openalex.org/W1533946607","https://openalex.org/W1845137714","https://openalex.org/W1976446088","https://openalex.org/W1987365175","https://openalex.org/W1995973731","https://openalex.org/W2066055909","https://openalex.org/W2072410439","https://openalex.org/W2073562093","https://openalex.org/W2095293504","https://openalex.org/W2099593264","https://openalex.org/W2099789730","https://openalex.org/W2102232904","https://openalex.org/W2128272588","https://openalex.org/W2131408881","https://openalex.org/W2139148100","https://openalex.org/W2153635508","https://openalex.org/W2169270715","https://openalex.org/W2169470206","https://openalex.org/W2185352626","https://openalex.org/W2280861083","https://openalex.org/W2401383085","https://openalex.org/W2476149483","https://openalex.org/W2799061466","https://openalex.org/W2913332048","https://openalex.org/W2914885528","https://openalex.org/W4243799827"],"related_works":["https://openalex.org/W4296209631","https://openalex.org/W2561617217","https://openalex.org/W2107628111","https://openalex.org/W4294811468","https://openalex.org/W2355801475","https://openalex.org/W106004901","https://openalex.org/W2394004323","https://openalex.org/W2170062176","https://openalex.org/W4206659427","https://openalex.org/W2398764543"],"abstract_inverted_index":{"This":[0],"article":[1],"addresses":[2],"the":[3,47,67,84,130,139,145,155,159,165,175,189,208,243,248],"problem":[4,61],"of":[5,15,49,69,94,102,144,151,158,191,202,242,247],"spam":[6],"blog":[7,88,131,166,233],"(splog)":[8],"detection":[9,60,125],"using":[10,134,169,265],"temporal":[11,113,132,156,167,204,210],"and":[12,19,42,115,148,185,195],"structural":[13],"regularity":[14],"content,":[16,147],"post":[17,160],"time":[18],"links.":[20],"Splogs":[21],"are":[22,109,118,219],"undesirable":[23],"blogs":[24,192,194],"meant":[25],"to":[26,66,153,206],"attract":[27],"search":[28,50],"engine":[29,51],"traffic,":[30],"used":[31],"solely":[32],"for":[33,79],"promoting":[34],"affiliate":[35],"sites.":[36],"Blogs":[37],"represent":[38,129],"popular":[39],"online":[40],"media,":[41],"splogs":[43,108],"not":[44],"only":[45],"degrade":[46],"quality":[48],"results,":[52],"but":[53],"also":[54],"waste":[55],"network":[56],"resources.":[57],"The":[58,178,245],"splog":[59,124,209,214,263],"is":[62,89,251],"made":[63],"difficult":[64],"due":[65],"lack":[68],"stable":[70],"content":[71,222,228],"descriptors.":[72],"We":[73,128,163,198,225,258],"have":[74,259],"developed":[75],"a":[76,87,90,100,170,227],"new":[77],"technique":[78],"detecting":[80],"splogs,":[81],"based":[82,223,229],"on":[83,138,188,268],"observation":[85],"that":[86],"dynamic,":[91],"growing":[92],"sequence":[93],"entries":[95],"(or":[96],"posts)":[97],"rather":[98],"than":[99],"collection":[101],"individual":[103],"pages.":[104],"In":[105,212],"our":[106,123,213],"approach,":[107],"recognized":[110],"by":[111,253],"their":[112],"characteristics":[114,168],"content.":[116],"There":[117],"three":[119],"key":[120],"ideas":[121],"in":[122],"framework.":[126],"(a)":[127],"dynamics":[133],"self-similarity":[135,176],"matrices":[136],"defined":[137],"histogram":[140],"intersection":[141],"similarity":[142],"measure":[143],"time,":[146],"link":[149],"attributes":[150,184],"posts,":[152,186],"investigate":[154],"changes":[157],"sequence.":[161],"(b)":[162],"study":[164],"visual":[171,179],"representation":[172],"derived":[173],"from":[174,232,239],"measures.":[177],"signature":[180],"reveals":[181],"correlation":[182],"between":[183],"depending":[187],"type":[190],"(normal":[193],"splogs).":[196],"(c)":[197],"propose":[199],"two":[200],"types":[201],"novel":[203,217],"features":[205,218,267],"capture":[207],"characteristics.":[211],"detector,":[215],"these":[216],"combined":[220],"with":[221,272],"features.":[224],"extract":[226],"feature":[230,249],"vector":[231,250],"home":[234],"pages":[235],"as":[236,238],"well":[237],"different":[240],"parts":[241],"blog.":[244],"dimensionality":[246],"reduced":[252],"Fisher":[254],"linear":[255],"discriminant":[256],"analysis.":[257],"tested":[260],"an":[261],"SVM-based":[262],"detector":[264],"proposed":[266],"real":[269],"world":[270],"datasets,":[271],"appreciable":[273],"results":[274],"(90%":[275],"accuracy).":[276]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":3},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":5}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
