{"id":"https://openalex.org/W2047324573","doi":"https://doi.org/10.1145/1571941.1572157","title":"Sifting micro-blogging stream for events of user interest","display_name":"Sifting micro-blogging stream for events of user interest","publication_year":2009,"publication_date":"2009-07-19","ids":{"openalex":"https://openalex.org/W2047324573","doi":"https://doi.org/10.1145/1571941.1572157","mag":"2047324573"},"language":"en","primary_location":{"id":"doi:10.1145/1571941.1572157","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1571941.1572157","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108451635","display_name":"Maxim Grinev","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":true,"raw_author_name":"Maxim Grinev","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031395328","display_name":"Maria Grineva","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Maria Grineva","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053980142","display_name":"Alexander Boldakov","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Alexander Boldakov","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008552844","display_name":"Leonid Novak","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Leonid Novak","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049616432","display_name":"Andrey Syssoev","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Andrey Syssoev","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031099526","display_name":"Dmitry Lizorkin","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101868","display_name":"Institute for System Programming","ror":"https://ror.org/017ef8252","country_code":"RU","type":"facility","lineage":["https://openalex.org/I1313323035","https://openalex.org/I4210101868","https://openalex.org/I4210124601"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Dmitry Lizorkin","raw_affiliation_strings":["Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed"],"affiliations":[{"raw_affiliation_string":"Institute for System Programming of the Russian Academy of Sciences, Moscow, Russian Fed","institution_ids":["https://openalex.org/I4210101868"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5108451635"],"corresponding_institution_ids":["https://openalex.org/I4210101868"],"apc_list":null,"apc_paid":null,"fwci":4.9556,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.950816,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"837","last_page":"837"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9574000239372253,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6724278926849365},{"id":"https://openalex.org/keywords/microblogging","display_name":"Microblogging","score":0.6265971064567566},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3423624038696289},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.3201953172683716}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6724278926849365},{"id":"https://openalex.org/C143275388","wikidata":"https://www.wikidata.org/wiki/Q92438","display_name":"Microblogging","level":3,"score":0.6265971064567566},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3423624038696289},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.3201953172683716}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1571941.1572157","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1571941.1572157","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.565.4701","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.565.4701","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://mint.typepad.com/mypapers/demo-tweet-sieve.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W1485672862","https://openalex.org/W2135342207","https://openalex.org/W2145049651","https://openalex.org/W6680250353"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2728430307","https://openalex.org/W2107786128","https://openalex.org/W2053241453","https://openalex.org/W2153980712","https://openalex.org/W2537388533","https://openalex.org/W2978974359","https://openalex.org/W2021183651","https://openalex.org/W2036556872","https://openalex.org/W2017590198"],"abstract_inverted_index":{"Micro-blogging":[0],"is":[1,43,76,85,157,170,188,285,317,392,447],"a":[2,33,77,101,112,125,168,268,355,364,505],"new":[3,145,506],"form":[4],"of":[5,35,51,79,95,97,104,115,128,136,141,175,231,243,310,323,336,349,357,371,405,424,440,487,490,497,508],"social":[6,116],"communication":[7],"that":[8,120,197,219,270,345,416,446],"encourages":[9],"users":[10],"to":[11,27,49,61,67,287,291,319,450,461,464,504],"share":[12],"information":[13,82],"about":[14,83],"anything":[15],"they":[16],"are":[17,54,399],"seeing":[18],"or":[19,259],"doing,":[20],"the":[21,25,38,88,93,149,161,165,200,210,228,232,244,262,280,303,315,321,334,340,350,358,378,381,385,389,397,403,408,412,422,428,437,472,477,485,495],"motivation":[22],"facilitated":[23],"by":[24,57,278,326,401],"ability":[26],"post":[28],"brief":[29],"text":[30],"messages":[31,196,245,379,415,426,458,470],"through":[32],"variety":[34],"devices.":[36],"Twitter,":[37],"most":[39,473],"popular":[40,113],"micro-blogging":[41,162],"tool,":[42],"exhibiting":[44],"rapid":[45],"growth":[46],"[3]:":[47],"up":[48],"11%":[50],"online":[52],"Americans":[53],"using":[55],"Twitter":[56,281],"December":[58],"2008,":[59],"compared":[60],"6%":[62],"in":[63,87,143,160,235,246,253,300,308,384,396,431,500],"May":[64],"2008.":[65],"Due":[66],"its":[68],"nature,":[69],"micro-blogosphere":[70,109,142],"has":[71,122],"unique":[72],"features:":[73],"(i)":[74],"It":[75,91],"source":[78,127],"extremely":[80,129],"up-to-date":[81,130],"what":[84],"happening":[86],"world;":[89],"(ii)":[90],"captures":[92],"wisdom":[94],"millions":[96],"people":[98],"and":[99,193,208,297,342,467,510],"covers":[100],"broad":[102],"range":[103],"domains.":[105],"These":[106],"features":[107],"make":[108,207],"more":[110,225],"than":[111,227,307],"medium":[114],"communication:":[117],"we":[118,147,206,435,480],"believe":[119],"it":[121],"additionally":[123],"become":[124],"valuable":[126],"news":[131,176,273,419,502],"on":[132,164,177,274],"virtually":[133],"any":[134,154,275],"subject":[135,156,233,277,322,341],"user":[137,221,316],"interest.":[138],"Making":[139],"use":[140,481],"this":[144,178],"role":[146],"meet":[148],"following":[150,211],"challenges:":[151],"(A)":[152,213],"Since":[153],"given":[155,276],"generally":[158],"mentioned":[159],"stream":[163,186,386],"continuous":[166],"basis,":[167],"method":[169],"needed":[171],"for":[172,183,190,194,239,339,360,484],"locating":[173],"periods":[174,404],"subject.":[179,366],"(B)":[180,241],"Additionally,":[181],"even":[182],"such":[184],"periods,":[185],"filtering":[187,452],"required":[189],"removing":[191],"noise":[192],"extracting":[195],"best":[198,346,417],"describe":[199,250,347,418],"news.":[201],"To":[202],"address":[203],"these":[204],"challenges":[205],"exploit":[209],"observations:":[212],"For":[214,421],"an":[215,247,327,432],"arbitrary":[216,328],"subject,":[217],"events":[218,337],"catch":[220],"interest":[222,325],"gain":[223],"distinguishably":[224],"attention":[226],"average":[229],"mentioning":[230],"resulting":[234],"message":[236],"activity":[237,248,375,433],"bursts":[238,395],"it.":[240],"Most":[242],"burst":[249],"common":[251],"event":[252],"close":[254],"variations":[255],"-":[256,267],"either":[257],"rephrased":[258],"\"retweeted\"":[260],"between":[261],"users.":[263],"We":[264],"demonstrate":[265],"TweetSieve":[266,313],"system":[269,332,359],"allows":[271],"obtaining":[272],"sifting":[279],"stream.":[282],"Our":[283],"work":[284],"related":[286],"frequecy-based":[288],"analysis":[289,304],"applied":[290],"blogs":[292,301],"[1],":[293],"but":[294],"higher":[295],"latency":[296],"lower":[298],"coverage":[299,511],"makes":[302],"less":[305],"effective":[306],"case":[309],"micro-blogs.":[311],"In":[312],"demo,":[314],"able":[318],"express":[320],"her":[324],"search":[329,382,429],"string.":[330],"The":[331,367,455,492],"shows":[333,354],"period":[335],"occuring":[338],"outputs":[343],"tweets":[344],"each":[348,465],"events.":[351,420],"Figure":[352],"1":[353],"screenshot":[356],"\"Semantic":[361],"search\"":[362],"as":[363],"sample":[365],"underlying":[368],"process":[369],"consists":[370],"two":[372],"steps:":[373],"Identifying":[374],"bursts.":[376],"Counting":[377],"matching":[380,427],"string":[383,430],"over":[387],"time,":[388],"frequency":[390,406],"curve":[391,398],"constructed.":[393],"Activity":[394],"identified":[400],"taking":[402],"exceeding":[407],"standard":[409],"deviation":[410],"from":[411,471],"average.":[413],"Selecting":[414],"set":[423],"all":[425],"burst,":[434],"apply":[436],"message-granular":[438],"variation":[439],"our":[441,498],"keyphrase":[442],"extraction":[443],"algorithm":[444,456],"[2]":[445],"specifically":[448],"suited":[449],"efficiently":[451],"noisy":[453],"data.":[454],"clusters":[457],"with":[459],"respect":[460],"their":[462],"similarity":[463,478],"other":[466],"chooses":[468],"central":[469],"dense":[474],"clusters.":[475],"As":[476],"measure":[479],"Jaccard":[482],"coefficient":[483],"\"bag":[486],"words\"":[488],"representation":[489],"messages.":[491],"demonstration":[493],"illustrates":[494],"potential":[496],"approach":[499],"bringing":[501],"acquisition":[503],"level":[507],"promptness":[509],"range.":[512]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":5}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
