{"id":"https://openalex.org/W2296421757","doi":"https://doi.org/10.1109/bigcomp.2016.7425926","title":"An approach to spam comment detection through domain-independent features","display_name":"An approach to spam comment detection through domain-independent features","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2296421757","doi":"https://doi.org/10.1109/bigcomp.2016.7425926","mag":"2296421757"},"language":"en","primary_location":{"id":"doi:10.1109/bigcomp.2016.7425926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp.2016.7425926","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Conference on Big Data and Smart Computing (BigComp)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035173149","display_name":"Jong Myoung Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]},{"id":"https://openalex.org/I4210134443","display_name":"Daejeon Institute of Science and Technology","ror":"https://ror.org/032qr1v70","country_code":"KR","type":"education","lineage":["https://openalex.org/I4210134443"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jong Myoung Kim","raw_affiliation_strings":["Korea Advanced Institute of Science and Technology, Daejeon, Daejeon, KR"],"affiliations":[{"raw_affiliation_string":"Korea Advanced Institute of Science and Technology, Daejeon, Daejeon, KR","institution_ids":["https://openalex.org/I4210134443","https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010702241","display_name":"Zae Myung Kim","orcid":"https://orcid.org/0000-0002-2572-6348"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Zae Myung Kim","raw_affiliation_strings":["School of Computing, Korea Advanced Institute of Science and Technology (KAIST)"],"affiliations":[{"raw_affiliation_string":"School of Computing, Korea Advanced Institute of Science and Technology (KAIST)","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039785089","display_name":"Kwangjo Kim","orcid":"https://orcid.org/0000-0002-8922-6203"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kwangjo Kim","raw_affiliation_strings":["School of Computing, Korea Advanced Institute of Science and Technology (KAIST)"],"affiliations":[{"raw_affiliation_string":"School of Computing, Korea Advanced Institute of Science and Technology (KAIST)","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5035173149"],"corresponding_institution_ids":["https://openalex.org/I157485424","https://openalex.org/I4210134443"],"apc_list":null,"apc_paid":null,"fwci":3.3174,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.92864191,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"273","last_page":"276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8260781764984131},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7053874135017395},{"id":"https://openalex.org/keywords/bag-of-words-model","display_name":"Bag-of-words model","score":0.637081503868103},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.6264214515686035},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5967081189155579},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5948459506034851},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5636268258094788},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5636101961135864},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5355619788169861},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.5297435522079468},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5296164751052856},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.5128524303436279},{"id":"https://openalex.org/keywords/spamming","display_name":"Spamming","score":0.4878659248352051},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.47283467650413513},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4686911106109619},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4356900155544281},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.42334532737731934},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41731902956962585},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4101765751838684},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3488602042198181},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.22163748741149902},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.16135430335998535}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8260781764984131},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7053874135017395},{"id":"https://openalex.org/C13672336","wikidata":"https://www.wikidata.org/wiki/Q3460803","display_name":"Bag-of-words model","level":2,"score":0.637081503868103},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.6264214515686035},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5967081189155579},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5948459506034851},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5636268258094788},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5636101961135864},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5355619788169861},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.5297435522079468},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5296164751052856},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.5128524303436279},{"id":"https://openalex.org/C158955206","wikidata":"https://www.wikidata.org/wiki/Q83058","display_name":"Spamming","level":3,"score":0.4878659248352051},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.47283467650413513},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4686911106109619},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4356900155544281},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.42334532737731934},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41731902956962585},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4101765751838684},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3488602042198181},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.22163748741149902},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.16135430335998535},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigcomp.2016.7425926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp.2016.7425926","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Conference on Big Data and Smart Computing (BigComp)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7400000095367432}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W66884126","https://openalex.org/W1530636824","https://openalex.org/W2027719216","https://openalex.org/W2058737869","https://openalex.org/W2062614982","https://openalex.org/W2085302848","https://openalex.org/W2108335766","https://openalex.org/W2121871834","https://openalex.org/W2123442489","https://openalex.org/W2149684865","https://openalex.org/W6677885705","https://openalex.org/W7017059801"],"related_works":["https://openalex.org/W156213964","https://openalex.org/W2050960118","https://openalex.org/W3149865514","https://openalex.org/W2943490005","https://openalex.org/W2141479508","https://openalex.org/W2003072179","https://openalex.org/W2165805973","https://openalex.org/W3036941175","https://openalex.org/W2609539975","https://openalex.org/W4292167554"],"abstract_inverted_index":{"Previous":[0],"research":[1],"in":[2,6,23,39,123,143],"spam":[3,8,25,49,97,108],"detection,":[4],"especially":[5],"email":[7],"filtering,":[9],"mainly":[10],"focused":[11],"on":[12,161,175],"learning":[13,74,92],"a":[14,75,93],"set":[15,94],"of":[16,55,95,145,179],"discriminative":[17],"features":[18],"that":[19,44],"are":[20,32,115,165],"often":[21],"present":[22],"the":[24,35,62,65,100,112,119,124,129,133,147,152,157,169,176],"contents.":[26],"Nowadays,":[27],"these":[28],"commercially":[29],"oriented":[30],"spams":[31,43],"well":[33],"detected;":[34],"real":[36],"challenge":[37],"lies":[38],"filtering":[40],"rather":[41],"vague":[42],"do":[45],"not":[46],"exhibit":[47],"distinctive":[48],"keywords.":[50],"We":[51],"investigate":[52],"two":[53],"ways":[54],"detecting":[56,162],"such":[57,79],"spams:":[58],"1)":[59],"By":[60],"comparing":[61],"similarity":[63,141],"between":[64],"publisher":[66],"posts":[67],"and":[68,71,99,138],"user":[69,81],"comments,":[70],"2)":[72],"by":[73,183],"single":[76],"representative":[77],"meta-feature":[78],"as":[80],"name":[82],"or":[83],"ID.":[84],"The":[85],"first":[86,125,158],"measure":[87,102,142],"relieves":[88],"us":[89,104],"from":[90],"repetitively":[91],"domain-dependent":[96],"features,":[98],"second":[101,170],"enables":[103],"to":[105,118,150],"detect":[106],"potential":[107],"users":[109],"even":[110],"before":[111],"aggressive":[113],"actions":[114],"performed.":[116],"Prior":[117],"language":[120,148],"model":[121],"comparison":[122],"method,":[126],"we":[127,172],"supplement":[128],"background":[130],"information,":[131],"normalize":[132],"text,":[134],"perform":[135],"co-reference":[136],"resolution,":[137],"conduct":[139],"word-to-word":[140],"hope":[144],"enriching":[146],"models":[149],"improve":[151],"classification":[153],"accuracy.":[154],"To":[155],"evaluate":[156],"measure,":[159,171],"experiments":[160],"blog-spam":[163],"comments":[164],"conducted.":[166],"As":[167],"for":[168],"employ":[173],"SVM":[174],"ID":[177],"space":[178],"e-mail":[180],"data":[181],"collected":[182],"\u201cApache":[184],"Spam":[185],"Assassin\u201d.":[186]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
