{"id":"https://openalex.org/W2077916364","doi":"https://doi.org/10.1145/2505515.2505709","title":"On sparsity and drift for effective real-time filtering in microblogs","display_name":"On sparsity and drift for effective real-time filtering in microblogs","publication_year":2013,"publication_date":"2013-10-27","ids":{"openalex":"https://openalex.org/W2077916364","doi":"https://doi.org/10.1145/2505515.2505709","mag":"2077916364"},"language":"en","primary_location":{"id":"doi:10.1145/2505515.2505709","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505515.2505709","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM international conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001632477","display_name":"M\u2010Dyaa Albakour","orcid":null},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"M-Dyaa Albakour","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom","University of Glasgow, Glasgow, United Kingdom#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom#TAB#","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057643560","display_name":"Craig Macdonald","orcid":"https://orcid.org/0000-0003-3143-279X"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Craig Macdonald","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom","University of Glasgow, Glasgow, United Kingdom#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom#TAB#","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079046603","display_name":"Iadh Ounis","orcid":"https://orcid.org/0000-0003-4701-3223"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Iadh Ounis","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom","University of Glasgow, Glasgow, United Kingdom#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom#TAB#","institution_ids":["https://openalex.org/I7882870"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.9969,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.94023181,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"419","last_page":"428"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microblogging","display_name":"Microblogging","score":0.9178342819213867},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8292018175125122},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7861393094062805},{"id":"https://openalex.org/keywords/concept-drift","display_name":"Concept drift","score":0.7077904343605042},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6055539846420288},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5963178873062134},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.5438041090965271},{"id":"https://openalex.org/keywords/streaming-data","display_name":"Streaming data","score":0.50179123878479},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.4832761883735657},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4828386902809143},{"id":"https://openalex.org/keywords/relevance-feedback","display_name":"Relevance feedback","score":0.4321925640106201},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.41591209173202515},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31934502720832825},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.27525055408477783},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.2027759850025177},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.08137613534927368}],"concepts":[{"id":"https://openalex.org/C143275388","wikidata":"https://www.wikidata.org/wiki/Q92438","display_name":"Microblogging","level":3,"score":0.9178342819213867},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8292018175125122},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7861393094062805},{"id":"https://openalex.org/C60777511","wikidata":"https://www.wikidata.org/wiki/Q3045002","display_name":"Concept drift","level":3,"score":0.7077904343605042},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6055539846420288},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5963178873062134},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.5438041090965271},{"id":"https://openalex.org/C2777611316","wikidata":"https://www.wikidata.org/wiki/Q39045282","display_name":"Streaming data","level":2,"score":0.50179123878479},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.4832761883735657},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4828386902809143},{"id":"https://openalex.org/C2779532271","wikidata":"https://www.wikidata.org/wiki/Q445558","display_name":"Relevance feedback","level":4,"score":0.4321925640106201},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.41591209173202515},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31934502720832825},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.27525055408477783},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.2027759850025177},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.08137613534927368},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2505515.2505709","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2505515.2505709","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM international conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W9861414","https://openalex.org/W73128518","https://openalex.org/W1524345994","https://openalex.org/W1549229937","https://openalex.org/W1970461679","https://openalex.org/W1972594981","https://openalex.org/W1978239142","https://openalex.org/W1979459060","https://openalex.org/W1985277880","https://openalex.org/W1990821053","https://openalex.org/W2000200507","https://openalex.org/W2036543198","https://openalex.org/W2053968437","https://openalex.org/W2055400882","https://openalex.org/W2056952906","https://openalex.org/W2062614982","https://openalex.org/W2091825929","https://openalex.org/W2098766443","https://openalex.org/W2098825757","https://openalex.org/W2106365165","https://openalex.org/W2110891465","https://openalex.org/W2124499489","https://openalex.org/W2153756419","https://openalex.org/W2155482025","https://openalex.org/W2164547069","https://openalex.org/W2187652355","https://openalex.org/W2339562433","https://openalex.org/W2341079710","https://openalex.org/W2643544958","https://openalex.org/W4231856373","https://openalex.org/W6661805154","https://openalex.org/W6684151790","https://openalex.org/W6703967046","https://openalex.org/W6704412327"],"related_works":["https://openalex.org/W4281572076","https://openalex.org/W2917311036","https://openalex.org/W3041820423","https://openalex.org/W2601363847","https://openalex.org/W3155148637","https://openalex.org/W2981673118","https://openalex.org/W3007751950","https://openalex.org/W4385399313","https://openalex.org/W2068319486","https://openalex.org/W2759864402"],"abstract_inverted_index":{"In":[0,47,63],"this":[1],"paper,":[2],"we":[3,50,96,122,148,175],"approach":[4,179],"the":[5,11,42,68,79,83,86,92,111,115,124,130,133,140,144,170,191,208],"problem":[6],"of":[7,41,70,85,110,132,185,210],"real-time":[8],"filtering":[9,21,187,202],"in":[10,45,58,143],"Twitter":[12,155],"Microblogging":[13],"platform.":[14],"We":[15],"adapt":[16],"an":[17,150],"effective":[18,181],"traditional":[19],"news":[20,201],"technique,":[22],"which":[23,163],"uses":[24],"a":[25,39,107,183],"text":[26],"classifier":[27],"inspired":[28],"by":[29],"Rocchio's":[30],"relevance":[31],"feedback":[32],"algorithm,":[33],"to":[34,78,90,100,118,127,159],"build":[35],"and":[36,61,139,156,194],"dynamically":[37],"update":[38],"profile":[40,126],"user's":[43,192],"interests":[44,84,113,142],"real-time.":[46],"our":[48,178],"adaptation,":[49],"tackle":[51,91],"two":[52],"challenges":[53],"that":[54,177,195],"are":[55],"particularly":[56],"prevalent":[57],"Twitter:":[59],"sparsity":[60,65,94],"drift.":[62],"particular,":[64],"stems":[66],"from":[67,154],"brevity":[69],"tweets,":[71],"while":[72],"drift":[73,164],"occurs":[74],"as":[75,190],"events":[76],"related":[77,104],"topic":[80,215],"develop":[81],"or":[82,103],"user":[87,112,125],"change.":[88],"First,":[89],"acute":[93],"problem,":[95],"apply":[97],"query":[98],"expansion":[99],"derive":[101],"terms":[102],"tweets":[105],"for":[106,182],"richer":[108],"initialisation":[109],"within":[114],"profile.":[116],"Second,":[117],"deal":[119],"with":[120,199],"drift,":[121],"modify":[123],"balance":[128],"between":[129],"importance":[131],"short-term":[134],"interests,":[135],"i.e.":[136],"emerging":[137],"subtopics,":[138],"long-term":[141],"overall":[145],"topic.":[146],"Moreover,":[147],"investigate":[149],"event":[151],"detection":[152],"method":[153],"newswire":[157],"streams":[158],"predict":[160],"times":[161],"at":[162],"may":[165],"happen.":[166],"Through":[167],"experiments":[168],"using":[169],"TREC":[171],"Microblog":[172],"track":[173],"2012,":[174],"show":[176],"is":[180],"number":[184],"common":[186],"metrics":[188],"such":[189],"utility,":[193],"it":[196],"compares":[197],"favourably":[198],"state-of-the-art":[200],"baselines.":[203],"Our":[204],"results":[205],"also":[206],"uncover":[207],"impact":[209],"different":[211],"factors":[212],"on":[213],"handling":[214],"drifting.":[216]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":7},{"year":2014,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
