{"id":"https://openalex.org/W4399729437","doi":"https://doi.org/10.1109/syscon61195.2024.10553540","title":"Comparison of Common Crawl News &amp; GDELT","display_name":"Comparison of Common Crawl News &amp; GDELT","publication_year":2024,"publication_date":"2024-04-15","ids":{"openalex":"https://openalex.org/W4399729437","doi":"https://doi.org/10.1109/syscon61195.2024.10553540"},"language":"en","primary_location":{"id":"doi:10.1109/syscon61195.2024.10553540","is_oa":false,"landing_page_url":"https://doi.org/10.1109/syscon61195.2024.10553540","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Systems Conference (SysCon)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099161875","display_name":"Ameir El Ouadi","orcid":null},"institutions":[{"id":"https://openalex.org/I192545095","display_name":"United States Military Academy","ror":"https://ror.org/01jepya76","country_code":"US","type":"education","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I192545095","https://openalex.org/I4210088792"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ameir El Ouadi","raw_affiliation_strings":["United States Military Academy,Department of Systems Engineering,West Point,NY,USA","Department of Systems Engineering, United States Military Academy, West Point, NY, USA"],"affiliations":[{"raw_affiliation_string":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA","institution_ids":["https://openalex.org/I192545095"]},{"raw_affiliation_string":"Department of Systems Engineering, United States Military Academy, West Point, NY, USA","institution_ids":["https://openalex.org/I192545095"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063173613","display_name":"David M. Beskow","orcid":"https://orcid.org/0000-0003-2814-8712"},"institutions":[{"id":"https://openalex.org/I192545095","display_name":"United States Military Academy","ror":"https://ror.org/01jepya76","country_code":"US","type":"education","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I192545095","https://openalex.org/I4210088792"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Beskow","raw_affiliation_strings":["United States Military Academy,Department of Systems Engineering,West Point,NY,USA","Department of Systems Engineering, United States Military Academy, West Point, NY, USA"],"affiliations":[{"raw_affiliation_string":"United States Military Academy,Department of Systems Engineering,West Point,NY,USA","institution_ids":["https://openalex.org/I192545095"]},{"raw_affiliation_string":"Department of Systems Engineering, United States Military Academy, West Point, NY, USA","institution_ids":["https://openalex.org/I192545095"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5099161875"],"corresponding_institution_ids":["https://openalex.org/I192545095"],"apc_list":null,"apc_paid":null,"fwci":1.6284,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.86323772,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"3"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9692999720573425,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.958299994468689,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.576676070690155},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.32216453552246094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.576676070690155},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.32216453552246094}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/syscon61195.2024.10553540","is_oa":false,"landing_page_url":"https://doi.org/10.1109/syscon61195.2024.10553540","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Systems Conference (SysCon)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W22264387","https://openalex.org/W317797172","https://openalex.org/W1889043906","https://openalex.org/W2022995284","https://openalex.org/W2129693401","https://openalex.org/W2140948436","https://openalex.org/W2170716095","https://openalex.org/W2250653840","https://openalex.org/W2294420157","https://openalex.org/W2612186099","https://openalex.org/W2626653630","https://openalex.org/W3094045953","https://openalex.org/W3174269049","https://openalex.org/W6611038622","https://openalex.org/W6691892052"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"The":[0],"corpus":[1,22],"of":[2,54,71],"worldwide":[3],"news":[4,43,88,97,119],"is":[5,23],"important":[6,24],"for":[7,25,46],"natural":[8],"language":[9,14],"processing,":[10],"knowledge":[11],"graphs,":[12],"large":[13],"models,":[15],"and":[16,31,57,60,69,77,86],"other":[17],"technical":[18],"efforts.":[19],"Additionally,":[20],"this":[21],"understanding":[26],"the":[27,51,67,91,101,114],"people,":[28],"places,":[29],"organizations,":[30],"events":[32],"that":[33],"interact":[34],"in":[35,112],"real-time":[36],"every":[37],"day.":[38],"This":[39],"paper":[40],"compares":[41],"two":[42,115],"datasets":[44,116],"used":[45],"these":[47],"tasks":[48],"today,":[49],"namely":[50],"Global":[52],"Database":[53],"Events,":[55],"Language,":[56],"Tone":[58],"(GDELT)":[59],"Common":[61,93],"Crawl":[62,94],"News.":[63],"Our":[64,107],"research":[65],"highlights":[66],"strengths":[68],"limitations":[70],"each":[72],"dataset,":[73],"analyzing":[74],"their":[75,118],"content":[76],"coverage.":[78],"Notably,":[79],"while":[80],"GDELT":[81],"relies":[82],"on":[83,96],"broadcasts,":[84],"prints,":[85],"web":[87,105],"from":[89,99],"across":[90],"globe,":[92],"focuses":[95],"sites":[98],"around":[100],"world":[102],"gathered":[103],"through":[104],"crawling.":[106],"analysis":[108],"revealed":[109],"considerable":[110],"differences":[111],"where":[113],"gather":[117],"sources.":[120]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
