{"id":"https://openalex.org/W4298251576","doi":"https://doi.org/10.1145/2817946.2817949","title":"On Predictability of Rare Events Leveraging Social Media","display_name":"On Predictability of Rare Events Leveraging Social Media","publication_year":2015,"publication_date":"2015-10-27","ids":{"openalex":"https://openalex.org/W4298251576","doi":"https://doi.org/10.1145/2817946.2817949"},"language":"en","primary_location":{"id":"doi:10.1145/2817946.2817949","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2817946.2817949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2015 ACM on Conference on Online Social Networks","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102347070","display_name":"Lei Le","orcid":"https://orcid.org/0000-0002-0123-1586"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"education","lineage":["https://openalex.org/I4210119109","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lei Le","raw_affiliation_strings":["Indiana University, Bloomington, IN, USA"],"affiliations":[{"raw_affiliation_string":"Indiana University, Bloomington, IN, USA","institution_ids":["https://openalex.org/I4210119109"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078699564","display_name":"Emilio Ferrara","orcid":"https://orcid.org/0000-0002-1942-2831"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"education","lineage":["https://openalex.org/I4210119109","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Emilio Ferrara","raw_affiliation_strings":["Indiana University, Bloomington, IN, USA"],"affiliations":[{"raw_affiliation_string":"Indiana University, Bloomington, IN, USA","institution_ids":["https://openalex.org/I4210119109"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011228873","display_name":"Alessandro Flammini","orcid":"https://orcid.org/0000-0003-1670-9156"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"education","lineage":["https://openalex.org/I4210119109","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alessandro Flammini","raw_affiliation_strings":["Indiana University, Bloomington, IN, USA"],"affiliations":[{"raw_affiliation_string":"Indiana University, Bloomington, IN, USA","institution_ids":["https://openalex.org/I4210119109"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102347070"],"corresponding_institution_ids":["https://openalex.org/I4210119109"],"apc_list":null,"apc_paid":null,"fwci":3.44284498,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.96175694,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9825000166893005,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9731000065803528,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7804819941520691},{"id":"https://openalex.org/keywords/predictability","display_name":"Predictability","score":0.7333406805992126},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7200430631637573},{"id":"https://openalex.org/keywords/predictive-power","display_name":"Predictive power","score":0.6698694825172424},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6421537399291992},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5810720920562744},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.5807280540466309},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4708613455295563},{"id":"https://openalex.org/keywords/profit","display_name":"Profit (economics)","score":0.4554654061794281},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3950735628604889},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.21902528405189514},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.2039012610912323},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.11310842633247375},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.11238843202590942}],"concepts":[{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7804819941520691},{"id":"https://openalex.org/C197640229","wikidata":"https://www.wikidata.org/wiki/Q2534066","display_name":"Predictability","level":2,"score":0.7333406805992126},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7200430631637573},{"id":"https://openalex.org/C2778136018","wikidata":"https://www.wikidata.org/wiki/Q10350689","display_name":"Predictive power","level":2,"score":0.6698694825172424},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6421537399291992},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5810720920562744},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.5807280540466309},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4708613455295563},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.4554654061794281},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3950735628604889},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.21902528405189514},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2039012610912323},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.11310842633247375},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.11238843202590942},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2817946.2817949","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2817946.2817949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2015 ACM on Conference on Online Social Networks","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W137217113","https://openalex.org/W153654188","https://openalex.org/W1515963492","https://openalex.org/W1590495275","https://openalex.org/W1853031019","https://openalex.org/W1964521983","https://openalex.org/W1971204783","https://openalex.org/W1974906280","https://openalex.org/W1983069677","https://openalex.org/W2004214228","https://openalex.org/W2015170579","https://openalex.org/W2015186536","https://openalex.org/W2018165284","https://openalex.org/W2028993035","https://openalex.org/W2037625889","https://openalex.org/W2068181924","https://openalex.org/W2088513386","https://openalex.org/W2097521684","https://openalex.org/W2097726431","https://openalex.org/W2101234009","https://openalex.org/W2113321055","https://openalex.org/W2114204486","https://openalex.org/W2134169864","https://openalex.org/W2137036358","https://openalex.org/W2147167010","https://openalex.org/W2148506018","https://openalex.org/W2165066692","https://openalex.org/W2171468534","https://openalex.org/W2250302982","https://openalex.org/W2997591727","https://openalex.org/W3098780114","https://openalex.org/W3123712780","https://openalex.org/W4205184193","https://openalex.org/W4285511343","https://openalex.org/W4300391517","https://openalex.org/W6639024449","https://openalex.org/W6691180351"],"related_works":["https://openalex.org/W3122845461","https://openalex.org/W3125380173","https://openalex.org/W3124164994","https://openalex.org/W4388281457","https://openalex.org/W4285890971","https://openalex.org/W4400439062","https://openalex.org/W3125898096","https://openalex.org/W1568456066","https://openalex.org/W3122679999","https://openalex.org/W1990819141"],"abstract_inverted_index":{"Information":[0],"extracted":[1],"from":[2,20,241],"social":[3,37,99,150],"media":[4,38,100],"streams":[5,101],"has":[6],"been":[7],"leveraged":[8,61],"to":[9,23,43,79,102,154,179,225],"forecast":[10],"the":[11,34,44,47,107,124,146,159,198,206,212,219,242,255,276,282],"outcome":[12],"of":[13,17,30,36,46,109,123,149,228,261],"a":[14,68,93,141,226],"large":[15],"number":[16],"real-world":[18],"events,":[19],"political":[21],"elections":[22],"stock":[24],"market":[25],"fluctuations.":[26],"An":[27],"increasing":[28],"amount":[29],"studies":[31],"demonstrates":[32],"how":[33,75],"analysis":[35,191],"conversations":[39,256],"provides":[40,222],"cheap":[41],"access":[42],"wisdom":[45],"crowd.":[48],"However,":[49],"extents":[50],"and":[51,105,152,192,218,248,273,275,288],"contexts":[52],"in":[53,67,114,118],"which":[54,119],"such":[55,156,167],"forecasting":[56],"power":[57,148,157],"can":[58],"be":[59],"effectively":[60],"are":[62],"still":[63],"unverified":[64],"at":[65,120],"least":[66,121],"systematic":[69,142],"way.":[70],"It":[71],"is":[72,127,186],"also":[73],"unclear":[74],"social-media-based":[76],"predictions":[77],"compare":[78,155],"those":[80],"based":[81,187],"on":[82,116,188],"alternative":[83],"information":[84],"sources.":[85,165],"To":[86,231],"address":[87],"these":[88],"issues,":[89],"here":[90],"we":[91,235],"develop":[92],"machine":[94],"learning":[95,213],"framework":[96,171,234],"that":[97,137],"leverages":[98],"automatically":[103],"identify":[104],"predict":[106],"outcomes":[108,126],"soccer":[110,259],"matches.":[111],"We":[112,135,204],"focus":[113],"particular":[115],"matches":[117,260],"one":[122],"possible":[125],"deemed":[128],"as":[129,223],"highly":[130],"unlikely":[131],"by":[132,163,253],"professional":[133],"bookmakers.":[134],"argue":[136],"sport":[138],"events":[139],"offer":[140],"approach":[143],"for":[144,201],"testing":[145],"predictive":[147],"media,":[151],"allow":[153],"against":[158],"rigorous":[160],"baselines":[161],"set":[162,227],"external":[164],"Despite":[166],"strict":[168],"baselines,":[169],"our":[170,209,233],"yields":[172],"above":[173],"8%":[174],"marginal":[175],"profit":[176],"when":[177],"used":[178],"inform":[180],"simple":[181],"betting":[182,229],"strategies.":[183,230],"The":[184],"system":[185],"real-time":[189,249],"sentiment":[190],"exploits":[193],"data":[194,240,251],"collected":[195,252],"immediately":[196],"before":[197],"games,":[199,247],"allowing":[200],"informed":[202],"bets.":[203],"discuss":[205],"rationale":[207],"behind":[208],"approach,":[210],"describe":[211],"framework,":[214],"its":[215],"prediction":[216],"performance":[217],"return":[220],"it":[221],"compared":[224],"test":[232],"use":[236],"both":[237],"historical":[238],"Twitter":[239,250],"2014":[243,277,287],"FIFA":[244],"World":[245],"Cup":[246],"monitoring":[254],"about":[257],"all":[258],"four":[262],"major":[263],"European":[264],"tournaments":[265],"(FA":[266],"Premier":[267],"League,":[268,280],"Serie":[269],"A,":[270],"La":[271],"Liga,":[272],"Bundesliga),":[274],"UEFA":[278],"Champions":[279],"during":[281],"period":[283],"between":[284],"Oct.":[285],"25th":[286],"Nov.":[289],"26th":[290],"2014.":[291]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2022-10-01T00:00:00"}
