{"id":"https://openalex.org/W3006737784","doi":"https://doi.org/10.1109/bigdata47090.2019.9006049","title":"Mining News Events from Comparable News Corpora: A Multi-Attribute Proximity Network Modeling Approach","display_name":"Mining News Events from Comparable News Corpora: A Multi-Attribute Proximity Network Modeling Approach","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3006737784","doi":"https://doi.org/10.1109/bigdata47090.2019.9006049","mag":"3006737784"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata47090.2019.9006049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074265179","display_name":"Hyungsul Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hyungsul Kim","raw_affiliation_strings":["The University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"The University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035119055","display_name":"Ahmed El-Kishky","orcid":"https://orcid.org/0000-0003-0121-7781"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ahmed El-Kishky","raw_affiliation_strings":["The University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"The University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009408707","display_name":"Xiang Ren","orcid":"https://orcid.org/0000-0001-8655-663X"},"institutions":[{"id":"https://openalex.org/I2800817003","display_name":"Southern California University for Professional Studies","ror":"https://ror.org/058zz0t50","country_code":"US","type":"education","lineage":["https://openalex.org/I2800817003"]},{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiang Ren","raw_affiliation_strings":["University of Southern California"],"affiliations":[{"raw_affiliation_string":"University of Southern California","institution_ids":["https://openalex.org/I2800817003","https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019539533","display_name":"Jiawei Han","orcid":"https://orcid.org/0000-0002-3629-2696"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiawei Han","raw_affiliation_strings":["The University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"The University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5074265179"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.19654576,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"105","last_page":"114"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8242166042327881},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8241815567016602},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6990102529525757},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5650435090065002},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.4908974766731262},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.4850872755050659},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4624950885772705},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42189300060272217},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3413313925266266}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8242166042327881},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8241815567016602},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6990102529525757},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5650435090065002},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.4908974766731262},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.4850872755050659},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4624950885772705},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42189300060272217},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3413313925266266},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata47090.2019.9006049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W30314283","https://openalex.org/W1579579982","https://openalex.org/W1630641096","https://openalex.org/W1975879668","https://openalex.org/W1982008367","https://openalex.org/W2015370225","https://openalex.org/W2029915058","https://openalex.org/W2034707531","https://openalex.org/W2041590596","https://openalex.org/W2046902062","https://openalex.org/W2048030219","https://openalex.org/W2052635433","https://openalex.org/W2066727938","https://openalex.org/W2085715652","https://openalex.org/W2097005391","https://openalex.org/W2098057544","https://openalex.org/W2102563561","https://openalex.org/W2103096174","https://openalex.org/W2107610218","https://openalex.org/W2108706252","https://openalex.org/W2112382532","https://openalex.org/W2123661878","https://openalex.org/W2124499489","https://openalex.org/W2127492100","https://openalex.org/W2147566544","https://openalex.org/W2149781590","https://openalex.org/W2150815390","https://openalex.org/W2154587273","https://openalex.org/W2165389462","https://openalex.org/W2168175751","https://openalex.org/W2171150534","https://openalex.org/W2223881431","https://openalex.org/W2339912288","https://openalex.org/W2375543500","https://openalex.org/W2425146075","https://openalex.org/W3140453591","https://openalex.org/W4231510805","https://openalex.org/W6601179756","https://openalex.org/W6636356626","https://openalex.org/W6639619044","https://openalex.org/W6657904428","https://openalex.org/W6674746900","https://openalex.org/W6675420493","https://openalex.org/W6681794421","https://openalex.org/W6682709453"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2973759123","https://openalex.org/W1517524280"],"abstract_inverted_index":{"We":[0,85,133],"present":[1],"ProxiModel,":[2],"a":[3,54,56,92,157,165],"novel":[4,57],"event":[5,12,34,64,76,78,129,147],"mining":[6],"framework":[7,142],"for":[8,74,164],"extracting":[9],"high-quality":[10,106,128],"structured":[11],"knowledge":[13],"from":[14,27,139],"large,":[15],"redundant,":[16],"and":[17,103,107,124,131,149,170],"noisy":[18],"news":[19,109,115,145,168,178],"data":[20,59],"sources.":[21],"The":[22],"proposed":[23,120,141],"model":[24,87],"differentiates":[25],"itself":[26],"other":[28],"approaches":[29],"by":[30],"modeling":[31],"both":[32],"the":[33,44,51,70,88,119,162],"correlation":[35],"within":[36],"each":[37],"individual":[38],"document":[39],"as":[40,42,80,82,91,144],"well":[41,81],"across":[43],"corpus.":[45],"To":[46],"facilitate":[47,62],"this,":[48],"we":[49,155],"introduce":[50],"concept":[52],"of":[53],"proximity-network,":[55],"space-efficient":[58],"structure":[60],"to":[61,101,174],"scalable":[63],"mining.":[65],"This":[66,98],"proximity":[67,89],"network":[68,90],"captures":[69],"corpus-level":[71],"co-occurence":[72],"statistics":[73],"candidate":[75],"descriptors,":[77],"attributes,":[79],"their":[83],"connections.":[84],"probabilistically":[86],"generative":[93],"process":[94],"with":[95],"sparsity-inducing":[96],"regularization.":[97],"allows":[99],"us":[100],"efficiently":[102],"effectively":[104],"extract":[105],"interpretable":[108],"events.":[110,179],"Experiments":[111],"on":[112,152,160],"three":[113],"different":[114],"corpora":[116],"demonstrate":[117,171],"that":[118],"method":[121],"is":[122],"effective":[123],"robust":[125],"at":[126],"generating":[127],"descriptors":[130],"attributes.":[132],"briefly":[134],"detail":[135],"many":[136],"interesting":[137],"applications":[138],"our":[140],"such":[143],"summarization,":[146],"tracking":[148],"multi-dimensional":[150],"analysis":[151],"news.":[153],"Finally,":[154],"explore":[156],"case":[158],"study":[159],"visualizing":[161],"events":[163],"Japan":[166],"Tsunami":[167],"corpus":[169],"ProxiModel's":[172],"ability":[173],"automatically":[175],"summarize":[176],"emerging":[177]},"counts_by_year":[{"year":2023,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
