{"id":"https://openalex.org/W2182847203","doi":"https://doi.org/10.1109/dsaa.2015.7344831","title":"A context-aware approach to detection of short irrelevant texts","display_name":"A context-aware approach to detection of short irrelevant texts","publication_year":2015,"publication_date":"2015-10-01","ids":{"openalex":"https://openalex.org/W2182847203","doi":"https://doi.org/10.1109/dsaa.2015.7344831","mag":"2182847203"},"language":"en","primary_location":{"id":"doi:10.1109/dsaa.2015.7344831","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsaa.2015.7344831","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Data Science and Advanced Analytics (DSAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102861459","display_name":"Sihong Xie","orcid":"https://orcid.org/0000-0001-5741-9740"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sihong Xie","raw_affiliation_strings":["Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103365400","display_name":"Jing Wang","orcid":"https://orcid.org/0009-0003-7041-994X"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jing Wang","raw_affiliation_strings":["Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056136571","display_name":"Mohammad Shafkat Amin","orcid":null},"institutions":[{"id":"https://openalex.org/I1316064682","display_name":"LinkedIn (United States)","ror":"https://ror.org/02fyxhe35","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I1316064682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohammad S. Amin","raw_affiliation_strings":["LinkedIn Corp, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"LinkedIn Corp, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1316064682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025750109","display_name":"Baoshi Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I1316064682","display_name":"LinkedIn (United States)","ror":"https://ror.org/02fyxhe35","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I1316064682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Baoshi Yan","raw_affiliation_strings":["LinkedIn Corp, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"LinkedIn Corp, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1316064682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038091890","display_name":"Anmol Bhasin","orcid":null},"institutions":[{"id":"https://openalex.org/I1316064682","display_name":"LinkedIn (United States)","ror":"https://ror.org/02fyxhe35","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I1316064682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anmol Bhasin","raw_affiliation_strings":["LinkedIn Corp, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"LinkedIn Corp, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1316064682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109181755","display_name":"Clement Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Clement Yu","raw_affiliation_strings":["Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I39422238"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036357902","display_name":"Philip S. Yu","orcid":"https://orcid.org/0000-0002-3491-5968"},"institutions":[{"id":"https://openalex.org/I39422238","display_name":"University of Illinois Chicago","ror":"https://ror.org/02mpq6x41","country_code":"US","type":"education","lineage":["https://openalex.org/I39422238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Philip S. Yu","raw_affiliation_strings":["Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Illinois at Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I39422238"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5102861459"],"corresponding_institution_ids":["https://openalex.org/I39422238"],"apc_list":null,"apc_paid":null,"fwci":1.5892,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.88022325,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7514772415161133},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6048322916030884},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4853774309158325},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42284440994262695},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.07550641894340515}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7514772415161133},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6048322916030884},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4853774309158325},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42284440994262695},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.07550641894340515},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dsaa.2015.7344831","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsaa.2015.7344831","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Data Science and Advanced Analytics (DSAA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320328656","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W203899762","https://openalex.org/W1527152942","https://openalex.org/W1573190978","https://openalex.org/W1714665356","https://openalex.org/W1758505613","https://openalex.org/W1880262756","https://openalex.org/W1918552589","https://openalex.org/W1970433929","https://openalex.org/W1975223096","https://openalex.org/W1979459060","https://openalex.org/W1984762104","https://openalex.org/W1993003681","https://openalex.org/W1999281295","https://openalex.org/W2013029404","https://openalex.org/W2016266039","https://openalex.org/W2046403398","https://openalex.org/W2047756776","https://openalex.org/W2055400882","https://openalex.org/W2063698478","https://openalex.org/W2101536553","https://openalex.org/W2103063352","https://openalex.org/W2112213600","https://openalex.org/W2121871834","https://openalex.org/W2123449924","https://openalex.org/W2128309578","https://openalex.org/W2129862897","https://openalex.org/W2139317750","https://openalex.org/W2151348518","https://openalex.org/W2159359879","https://openalex.org/W2161443453","https://openalex.org/W2165698076","https://openalex.org/W2167265881","https://openalex.org/W2171836785","https://openalex.org/W2189187207","https://openalex.org/W2278871742","https://openalex.org/W2393901657","https://openalex.org/W2396895200","https://openalex.org/W2401383085","https://openalex.org/W2405765071","https://openalex.org/W2547416858","https://openalex.org/W2845409342","https://openalex.org/W2853043441","https://openalex.org/W2859520785","https://openalex.org/W4213099427","https://openalex.org/W4231856373","https://openalex.org/W4285719527","https://openalex.org/W6677885705","https://openalex.org/W6687142891","https://openalex.org/W6712844215","https://openalex.org/W6729310784"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W4402327032","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,22,69,128,140,162,181,221,246],"simple":[4],"and":[5,17,24,32,42,65,76,92,105,112,147,192,240,243],"effective":[6],"framework":[7],"that":[8],"can":[9],"detect":[10],"irrelevant":[11,50,66,88],"short":[12,218],"text":[13,99],"contents":[14],"following":[15,103],"blogs":[16],"news":[18,104,239],"articles,":[19,41],"etc.":[20],"in":[21,161,220,251],"context-aware":[23,222],"timely":[25],"fashion.":[26],"Nowadays,":[27],"websites":[28,60],"such":[29],"as":[30,90,94],"Linkedin.com":[31],"CNN.com":[33],"allow":[34],"their":[35],"visitors":[36],"to":[37,48,85,118,139,152,156,212],"leave":[38],"comments":[39,67,89,102,131,170,178],"after":[40,133],"spammers":[43],"are":[44,108],"exploiting":[45],"this":[46],"feature":[47],"post":[49],"contents.":[51],"Visited":[52],"by":[53,110],"millions":[54],"of":[55,78,130,143,174,197,204,217,228,238,249],"readers":[56],"per":[57],"day,":[58],"these":[59,79,87],"have":[61,68],"extremely":[62],"high":[63],"visibility,":[64],"detrimental":[70],"effect":[71],"on":[72,232],"the":[73,158,190,201,215,226,229],"visiting":[74],"traffic":[75],"revenue":[77],"websites.":[80],"Therefore,":[81],"it":[82,116],"is":[83,136],"critical":[84],"eliminate":[86],"accurately":[91],"early":[93,202],"possible.":[95],"Different":[96],"from":[97],"traditional":[98,208],"mining":[100],"tasks,":[101],"blog":[106,241],"articles":[107,242],"characterized":[109],"briefness":[111],"context-dependent":[113,195],"semantics,":[114],"making":[115],"difficult":[117],"measure":[119],"semantic":[120],"relevance.":[121],"What's":[122],"worse,":[123],"there":[124],"could":[125],"be":[126],"only":[127],"handful":[129],"soon":[132],"an":[134],"article":[135],"posted,":[137],"leading":[138],"severe":[141],"lack":[142],"information":[144],"for":[145,169],"semantics":[146,196,216],"relevance":[148],"measurement.":[149],"We":[150,224],"propose":[151],"infer":[153],"\u201ccontext-aware":[154],"semantics\u201d":[155],"address":[157],"above":[159],"challenges":[160],"unified":[163],"framework.":[164],"Specifically,":[165],"we":[166],"construct":[167],"contexts":[168,188],"using":[171],"either":[172],"blocks":[173],"surrounding":[175],"comments,":[176,198,244],"or":[177],"collected":[179],"via":[180],"principled":[182],"transfer":[183],"learning":[184],"approach.":[185],"The":[186],"constructed":[187],"mitigate":[189],"sparseness":[191],"sharply":[193],"define":[194],"even":[199],"at":[200],"stage":[203],"commenting":[205],"activities,":[206],"allowing":[207],"dimension":[209],"reduction":[210],"methods":[211],"better":[213],"capture":[214],"texts":[219],"way.":[223],"confirm":[225],"effectiveness":[227],"proposed":[230],"method":[231],"two":[233],"real":[234],"world":[235],"datasets":[236],"consisting":[237],"with":[245],"maximal":[247],"improvement":[248],"20%":[250],"Area":[252],"Under":[253],"Precision-Recall":[254],"Curve.":[255]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
