{"id":"https://openalex.org/W2769324101","doi":"https://doi.org/10.1145/3110025.3110110","title":"Mining Frequency of Drug Side Effects over a Large Twitter Dataset Using Apache Spark","display_name":"Mining Frequency of Drug Side Effects over a Large Twitter Dataset Using Apache Spark","publication_year":2017,"publication_date":"2017-07-31","ids":{"openalex":"https://openalex.org/W2769324101","doi":"https://doi.org/10.1145/3110025.3110110","mag":"2769324101"},"language":"en","primary_location":{"id":"doi:10.1145/3110025.3110110","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3110025.3110110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 IEEE/ACM International Conference on Advances in Social Networks Analysis and Mining 2017","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019790871","display_name":"Dennis Hsu","orcid":null},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dennis Hsu","raw_affiliation_strings":["Department of Computer Science, San Jose State University, San Jose, CA, U.S.A"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, San Jose State University, San Jose, CA, U.S.A","institution_ids":["https://openalex.org/I51504820"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021884742","display_name":"Melody Moh","orcid":"https://orcid.org/0000-0002-8313-6645"},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Melody Moh","raw_affiliation_strings":["Department of Computer Science, San Jose State University, San Jose, CA, U.S.A"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, San Jose State University, San Jose, CA, U.S.A","institution_ids":["https://openalex.org/I51504820"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019298277","display_name":"Teng-Sheng Moh","orcid":"https://orcid.org/0000-0002-2726-102X"},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Teng-Sheng Moh","raw_affiliation_strings":["Department of Computer Science, San Jose State University, San Jose, CA, U.S.A"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, San Jose State University, San Jose, CA, U.S.A","institution_ids":["https://openalex.org/I51504820"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5019790871"],"corresponding_institution_ids":["https://openalex.org/I51504820"],"apc_list":null,"apc_paid":null,"fwci":1.1852,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.817504,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"915","last_page":"924"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.726203203201294},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6693257689476013},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6086422204971313},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5600895881652832},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.5537732243537903},{"id":"https://openalex.org/keywords/side-effect","display_name":"Side effect (computer science)","score":0.5537015795707703},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.515882134437561},{"id":"https://openalex.org/keywords/drug","display_name":"Drug","score":0.4744090735912323},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4465218186378479},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4441301226615906},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4408474862575531},{"id":"https://openalex.org/keywords/side-channel-attack","display_name":"Side channel attack","score":0.43458572030067444},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4250560402870178},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.415219783782959},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32789358496665955},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.21542391180992126},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.19280949234962463},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.18909427523612976},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15376907587051392},{"id":"https://openalex.org/keywords/pharmacology","display_name":"Pharmacology","score":0.12860536575317383}],"concepts":[{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.726203203201294},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6693257689476013},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6086422204971313},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5600895881652832},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.5537732243537903},{"id":"https://openalex.org/C3454156","wikidata":"https://www.wikidata.org/wiki/Q1144241","display_name":"Side effect (computer science)","level":2,"score":0.5537015795707703},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.515882134437561},{"id":"https://openalex.org/C2780035454","wikidata":"https://www.wikidata.org/wiki/Q8386","display_name":"Drug","level":2,"score":0.4744090735912323},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4465218186378479},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4441301226615906},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4408474862575531},{"id":"https://openalex.org/C49289754","wikidata":"https://www.wikidata.org/wiki/Q2267081","display_name":"Side channel attack","level":3,"score":0.43458572030067444},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4250560402870178},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.415219783782959},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32789358496665955},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.21542391180992126},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.19280949234962463},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.18909427523612976},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15376907587051392},{"id":"https://openalex.org/C98274493","wikidata":"https://www.wikidata.org/wiki/Q128406","display_name":"Pharmacology","level":1,"score":0.12860536575317383},{"id":"https://openalex.org/C178489894","wikidata":"https://www.wikidata.org/wiki/Q8789","display_name":"Cryptography","level":2,"score":0.0},{"id":"https://openalex.org/C87717796","wikidata":"https://www.wikidata.org/wiki/Q146326","display_name":"Environmental engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3110025.3110110","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3110025.3110110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 IEEE/ACM International Conference on Advances in Social Networks Analysis and Mining 2017","raw_type":"proceedings-article"},{"id":"pmh:oai:scholarworks.sjsu.edu:etd_projects-1549","is_oa":false,"landing_page_url":"https://scholarworks.sjsu.edu/etd_projects/549","pdf_url":null,"source":{"id":"https://openalex.org/S4377196389","display_name":"San Jos\u00e9 State University ScholarWorks (San Jose State University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I51504820","host_organization_name":"San Jose State University","host_organization_lineage":["https://openalex.org/I51504820"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Master's Projects","raw_type":"text"},{"id":"pmh:oai:scholarworks.sjsu.edu:etd_projects-1571","is_oa":false,"landing_page_url":"https://scholarworks.sjsu.edu/etd_projects/570","pdf_url":null,"source":{"id":"https://openalex.org/S4377196389","display_name":"San Jos\u00e9 State University ScholarWorks (San Jose State University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I51504820","host_organization_name":"San Jose State University","host_organization_lineage":["https://openalex.org/I51504820"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Master's Projects","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/3"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W177032395","https://openalex.org/W193524605","https://openalex.org/W1533946607","https://openalex.org/W1550258693","https://openalex.org/W1599730737","https://openalex.org/W1743243001","https://openalex.org/W1996430422","https://openalex.org/W2101234009","https://openalex.org/W2111975591","https://openalex.org/W2131975293","https://openalex.org/W2139212933","https://openalex.org/W2209293842","https://openalex.org/W2293502436","https://openalex.org/W2293903219","https://openalex.org/W2397292972","https://openalex.org/W2461345536","https://openalex.org/W2548865325","https://openalex.org/W2554028040","https://openalex.org/W2596834559","https://openalex.org/W2614252098","https://openalex.org/W2950974174","https://openalex.org/W2963288913","https://openalex.org/W2963891150","https://openalex.org/W2997591727","https://openalex.org/W3152231500","https://openalex.org/W3193477162","https://openalex.org/W4233906183","https://openalex.org/W4243217122","https://openalex.org/W4247144487","https://openalex.org/W4292550096","https://openalex.org/W6614148910","https://openalex.org/W6632118081"],"related_works":["https://openalex.org/W2548633793","https://openalex.org/W3013279174","https://openalex.org/W2941935829","https://openalex.org/W4323824501","https://openalex.org/W2596247554","https://openalex.org/W1975949872","https://openalex.org/W3159871278","https://openalex.org/W2230552005","https://openalex.org/W2905242764","https://openalex.org/W3132372214"],"abstract_inverted_index":{"Despite":[0],"clinical":[1],"trials":[2],"by":[3,159],"pharmaceutical":[4],"companies":[5],"as":[6,8,48,62,162,164],"well":[7,163],"current":[9,42],"FDA":[10],"reporting":[11],"systems,":[12],"there":[13],"are":[14],"still":[15],"drug":[16,65,178,233],"side":[17,66,102,126,135,179,198,234],"effects":[18,136,180,199,235],"that":[19],"have":[20,87,105,142,228],"not":[21],"been":[22],"caught.":[23],"To":[24,68],"find":[25],"a":[26,31,108,113,182,190],"larger":[27],"sample":[28],"of":[29,56,115,123,155,157,169,177,200,209,213],"reports,":[30],"possible":[32],"way":[33],"is":[34,137],"to":[35,53,119,151,165],"mine":[36],"online":[37],"social":[38,45],"media.":[39],"With":[40],"its":[41],"widespread":[43],"use,":[44],"media":[46],"such":[47],"Twitter":[49],"has":[50,75],"given":[51],"rise":[52],"massive":[54],"amounts":[55],"data,":[57],"which":[58],"can":[59],"be":[60],"used":[61],"reports":[63],"for":[64,78,133,185],"effects.":[67,103,127],"process":[69,168],"these":[70],"large":[71,170],"datasets,":[72],"Apache":[73,149],"Spark":[74,150],"become":[76],"popular":[77],"fast,":[79],"distributed":[80],"batch":[81],"processing.":[82],"In":[83,128],"this":[84,194,225],"work,":[85],"we":[86,141,188],"improved":[88],"on":[89,193,231,237],"previous":[90],"pipelines":[91],"in":[92,148,224,241],"sentimental":[93],"analysis-based":[94],"mining,":[95],"processing,":[96],"and":[97,205,220,236],"extracting":[98],"tweets":[99,158],"with":[100],"drug-caused":[101,125],"We":[104,215],"also":[106,138,143],"added":[107],"new":[109],"ensemble":[110],"classifier":[111],"using":[112,202,210],"combination":[114,212],"sentiment":[116],"analysis":[117,240],"features":[118],"increase":[120],"the":[121,130,134,145,153,167,174,197,206,217,221],"accuracy":[122],"identifying":[124],"addition,":[129],"frequency":[131,175],"count":[132,176],"provided.":[139],"Furthermore,":[140],"implemented":[144],"same":[146],"pipeline":[147,218],"improve":[152],"speed":[154],"processing":[156],"2.5":[160],"times,":[161],"support":[166],"tweet":[171],"datasets.":[172],"As":[173],"opens":[181],"wide":[183],"door":[184],"further":[186],"analysis,":[187],"present":[189,223],"preliminary":[191],"study":[192],"issue,":[195],"including":[196],"simultaneously":[201],"two":[203],"drugs,":[204],"potential":[207],"danger":[208],"less-common":[211],"drugs.":[214],"believe":[216],"design":[219],"results":[222],"work":[226],"would":[227],"great":[229],"implication":[230],"studying":[232],"big":[238],"data":[239],"general.":[242]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
