{"id":"https://openalex.org/W4284878731","doi":"https://doi.org/10.1145/3547146","title":"Using Machine Learning to Enhance Archival Processing of Social Media Archives","display_name":"Using Machine Learning to Enhance Archival Processing of Social Media Archives","publication_year":2022,"publication_date":"2022-07-08","ids":{"openalex":"https://openalex.org/W4284878731","doi":"https://doi.org/10.1145/3547146"},"language":"en","primary_location":{"id":"doi:10.1145/3547146","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3547146","pdf_url":null,"source":{"id":"https://openalex.org/S4210184050","display_name":"Journal on Computing and Cultural Heritage","issn_l":"1556-4673","issn":["1556-4673","1556-4711"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal on Computing and Cultural Heritage","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070395413","display_name":"Lizhou Fan","orcid":"https://orcid.org/0000-0002-7962-9113"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lizhou Fan","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066911623","display_name":"Zhanyuan Yin","orcid":"https://orcid.org/0000-0002-4561-9566"},"institutions":[{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhanyuan Yin","raw_affiliation_strings":["The University of Chicago, Chicago, IL"],"affiliations":[{"raw_affiliation_string":"The University of Chicago, Chicago, IL","institution_ids":["https://openalex.org/I40347166"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005046138","display_name":"Huizi Yu","orcid":"https://orcid.org/0000-0003-3776-9211"},"institutions":[{"id":"https://openalex.org/I27804330","display_name":"Brown University","ror":"https://ror.org/05gq02987","country_code":"US","type":"education","lineage":["https://openalex.org/I27804330"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huizi Yu","raw_affiliation_strings":["Brown University, Providence, RI"],"affiliations":[{"raw_affiliation_string":"Brown University, Providence, RI","institution_ids":["https://openalex.org/I27804330"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075849118","display_name":"Anne J. Gilliland","orcid":"https://orcid.org/0000-0002-4897-7780"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anne J. Gilliland","raw_affiliation_strings":["University of California, Los Angeles, CA"],"affiliations":[{"raw_affiliation_string":"University of California, Los Angeles, CA","institution_ids":["https://openalex.org/I161318765"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5070395413"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":0.5305,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.70254091,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"15","issue":"3","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10557","display_name":"Social Media and Politics","score":0.9545000195503235,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9169999957084656,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7362308502197266},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6452862620353699},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6051344871520996},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.6047185659408569},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5212934017181396},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4632471799850464},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4613744020462036},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.43861329555511475},{"id":"https://openalex.org/keywords/public-opinion","display_name":"Public opinion","score":0.4130541980266571},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.39577212929725647},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.1439422369003296},{"id":"https://openalex.org/keywords/politics","display_name":"Politics","score":0.1334713101387024}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7362308502197266},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6452862620353699},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6051344871520996},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.6047185659408569},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5212934017181396},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4632471799850464},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4613744020462036},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.43861329555511475},{"id":"https://openalex.org/C134698397","wikidata":"https://www.wikidata.org/wiki/Q17946","display_name":"Public opinion","level":3,"score":0.4130541980266571},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.39577212929725647},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.1439422369003296},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.1334713101387024},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3547146","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3547146","pdf_url":null,"source":{"id":"https://openalex.org/S4210184050","display_name":"Journal on Computing and Cultural Heritage","issn_l":"1556-4673","issn":["1556-4673","1556-4711"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal on Computing and Cultural Heritage","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W80056832","https://openalex.org/W970764947","https://openalex.org/W1536381417","https://openalex.org/W1594865592","https://openalex.org/W1595640372","https://openalex.org/W1819662813","https://openalex.org/W1820476779","https://openalex.org/W1857951938","https://openalex.org/W1883443290","https://openalex.org/W1973833378","https://openalex.org/W1988706181","https://openalex.org/W2009169253","https://openalex.org/W2071653415","https://openalex.org/W2156580264","https://openalex.org/W2180404376","https://openalex.org/W2195118991","https://openalex.org/W2311430799","https://openalex.org/W2473555522","https://openalex.org/W2564933006","https://openalex.org/W2575439561","https://openalex.org/W2595653137","https://openalex.org/W2741065173","https://openalex.org/W2758474413","https://openalex.org/W2764072425","https://openalex.org/W2767269108","https://openalex.org/W2777311577","https://openalex.org/W2784209217","https://openalex.org/W2897231284","https://openalex.org/W2898970033","https://openalex.org/W2963146848","https://openalex.org/W2963481894","https://openalex.org/W2963790884","https://openalex.org/W2975209231","https://openalex.org/W2990929101","https://openalex.org/W2997717978","https://openalex.org/W3003646990","https://openalex.org/W3008632661","https://openalex.org/W3011720243","https://openalex.org/W3029151080","https://openalex.org/W3033229567","https://openalex.org/W3034078763","https://openalex.org/W3035484701","https://openalex.org/W3037134736","https://openalex.org/W3040772153","https://openalex.org/W3041501620","https://openalex.org/W3094479746","https://openalex.org/W3103145424","https://openalex.org/W3122929941","https://openalex.org/W3124443940","https://openalex.org/W3136869059","https://openalex.org/W3196353406","https://openalex.org/W3205176231","https://openalex.org/W4233786305","https://openalex.org/W4320013936","https://openalex.org/W6638208828","https://openalex.org/W6731479946"],"related_works":["https://openalex.org/W2767450342","https://openalex.org/W4295151157","https://openalex.org/W2470196046","https://openalex.org/W2285821375","https://openalex.org/W3148030980","https://openalex.org/W4320063470","https://openalex.org/W2785337750","https://openalex.org/W2730929352","https://openalex.org/W2887671051","https://openalex.org/W4298858166"],"abstract_inverted_index":{"This":[0],"article":[1],"reports":[2],"on":[3,53],"a":[4,48],"study":[5,51],"using":[6,87],"machine":[7,102],"learning":[8,103],"to":[9,60,100,107,174],"identify":[10],"incidences":[11],"and":[12,33,41,68,72,82,104,109,114,155,160,170,178],"shifting":[13],"dynamics":[14],"of":[15,151],"hate":[16,85],"speech":[17,86],"in":[18,128,163],"social":[19,116],"media":[20,117],"archives.":[21],"To":[22],"better":[23],"cope":[24],"with":[25],"the":[26,39,75,88,152],"archival":[27,153],"processing":[28],"need":[29],"for":[30,84,125,132,139,147],"such":[31],"large-scale":[32],"fast":[34],"evolving":[35],"archives,":[36],"we":[37],"propose":[38],"Data-driven":[40],"Circulating":[42],"Archival":[43],"Processing":[44],"(DCAP)":[45],"method.":[46,93],"As":[47],"proof-of-concept,":[49],"our":[50],"focuses":[52],"an":[54],"English":[55],"language":[56],"Twitter":[57,79],"archive":[58],"relating":[59],"COVID-19:":[61],"Tweets":[62],"were":[63],"repeatedly":[64],"scraped":[65],"between":[66],"February":[67],"June":[69],"2020,":[70],"ingested":[71],"aggregated":[73],"within":[74],"COVID-19":[76],"Hate":[77],"Speech":[78],"Archive":[80],"(CHSTA),":[81],"analyzed":[83],"Generative":[89],"Adversarial":[90],"Network\u2013inspired":[91],"DCAP":[92],"Outcomes":[94],"suggest":[95],"that":[96,119,165],"it":[97],"is":[98],"possible":[99],"use":[101],"data":[105],"analytics":[106],"surface":[108],"substantiate":[110],"trends":[111],"from":[112],"CHSTA":[113],"similar":[115],"archives":[118],"could":[120],"provide":[121],"immediately":[122],"useful":[123],"knowledge":[124],"crisis":[126],"response,":[127],"controversial":[129],"situations,":[130],"or":[131],"public":[133],"policy":[134],"development,":[135],"as":[136,138],"well":[137],"subsequent":[140],"historical":[141],"analysis.":[142],"The":[143],"approach":[144],"shows":[145],"potential":[146],"integrating":[148],"multiple":[149],"aspects":[150],"workflow":[154],"supporting":[156],"automatic":[157],"iterative":[158],"redescription":[159],"reappraisal":[161],"activities":[162],"ways":[164],"make":[166],"them":[167],"more":[168,171],"accountable":[169],"rapidly":[172],"responsive":[173],"changing":[175],"societal":[176],"interests":[177],"unfolding":[179],"developments.":[180]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
