{"id":"https://openalex.org/W2196958957","doi":"https://doi.org/10.1109/bigdata.2015.7363938","title":"A method for cross-document narrative alignment of a two-hundred-sixty-million word corpus","display_name":"A method for cross-document narrative alignment of a two-hundred-sixty-million word corpus","publication_year":2015,"publication_date":"2015-10-01","ids":{"openalex":"https://openalex.org/W2196958957","doi":"https://doi.org/10.1109/bigdata.2015.7363938","mag":"2196958957"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2015.7363938","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7363938","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108689189","display_name":"Ben Miller","orcid":null},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ben Miller","raw_affiliation_strings":["Departments of English and Communication, Georgia State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of English and Communication, Georgia State University","institution_ids":["https://openalex.org/I181565077"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073195077","display_name":"Jennifer Olive","orcid":null},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jennifer Olive","raw_affiliation_strings":["Departments of English and Communication, Georgia State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Departments of English and Communication, Georgia State University","institution_ids":["https://openalex.org/I181565077"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058180229","display_name":"Shakthidhar Gopavaram","orcid":null},"institutions":[{"id":"https://openalex.org/I592451","display_name":"Indiana University","ror":"https://ror.org/01kg8sb98","country_code":"US","type":"education","lineage":["https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shakthidhar Gopavaram","raw_affiliation_strings":["Department of Computer Science, Indiana University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Indiana University","institution_ids":["https://openalex.org/I592451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031155251","display_name":"Yanjun Zhao","orcid":"https://orcid.org/0000-0002-6567-0422"},"institutions":[{"id":"https://openalex.org/I149292303","display_name":"Troy University","ror":"https://ror.org/029jj9438","country_code":"US","type":"education","lineage":["https://openalex.org/I149292303"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanjun Zhao","raw_affiliation_strings":["Department of Computer Science, Troy University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Troy University","institution_ids":["https://openalex.org/I149292303"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075541504","display_name":"Ayush Shrestha","orcid":"https://orcid.org/0009-0004-6203-3593"},"institutions":[{"id":"https://openalex.org/I149292303","display_name":"Troy University","ror":"https://ror.org/029jj9438","country_code":"US","type":"education","lineage":["https://openalex.org/I149292303"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ayush Shrestha","raw_affiliation_strings":["Department of Computer Science, Troy University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Troy University","institution_ids":["https://openalex.org/I149292303"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019528003","display_name":"Cynthia M. Berger","orcid":"https://orcid.org/0000-0001-7876-3997"},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cynthia Berger","raw_affiliation_strings":["Department of Applied Linguistics, Georgia State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Applied Linguistics, Georgia State University","institution_ids":["https://openalex.org/I181565077"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06762777,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"45","issue":null,"first_page":"1673","last_page":"1677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.828260064125061},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7494763135910034},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.7188124656677246},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6136447191238403},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6118870973587036},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5431153178215027},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5109983682632446},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5029074549674988},{"id":"https://openalex.org/keywords/text-segmentation","display_name":"Text segmentation","score":0.49867987632751465},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4871827960014343},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.4627760350704193},{"id":"https://openalex.org/keywords/text-corpus","display_name":"Text corpus","score":0.41339990496635437},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.25018221139907837},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.21361884474754333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.828260064125061},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7494763135910034},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.7188124656677246},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6136447191238403},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6118870973587036},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5431153178215027},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5109983682632446},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5029074549674988},{"id":"https://openalex.org/C98501671","wikidata":"https://www.wikidata.org/wiki/Q1948408","display_name":"Text segmentation","level":3,"score":0.49867987632751465},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4871827960014343},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.4627760350704193},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.41339990496635437},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.25018221139907837},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.21361884474754333},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2015.7363938","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2015.7363938","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6700000166893005,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2000900121","https://openalex.org/W2001856540","https://openalex.org/W2044222399","https://openalex.org/W2081580037","https://openalex.org/W2133496072","https://openalex.org/W2158794898","https://openalex.org/W2251322122","https://openalex.org/W2252074111","https://openalex.org/W2282627701","https://openalex.org/W4249258521","https://openalex.org/W6679820939","https://openalex.org/W6691161265","https://openalex.org/W6695387643"],"related_works":["https://openalex.org/W2172629291","https://openalex.org/W2380773642","https://openalex.org/W2384559435","https://openalex.org/W2337707338","https://openalex.org/W2393940967","https://openalex.org/W2159591557","https://openalex.org/W2785359773","https://openalex.org/W2058548953","https://openalex.org/W2385598138","https://openalex.org/W2366925922"],"abstract_inverted_index":{"Identifying":[0],"similar":[1,95],"narrative":[2,47,101,114],"sections":[3],"across":[4,49],"longer":[5],"documents":[6],"would":[7],"help":[8],"identify":[9],"key":[10],"events":[11],"within":[12],"a":[13,21,71,127,135],"corpus,":[14],"enrich":[15],"understanding":[16],"of":[17,36,38,73,77,80,85,113,119,121],"those":[18,81],"events,":[19,74,82],"provide":[20],"mechanism":[22],"for":[23,33,46],"organizing":[24],"corpora":[25,52],"according":[26],"to":[27,87,97,109,151,153],"their":[28],"event":[29],"content,":[30],"and":[31,59,134],"allow":[32],"bottom-up":[34],"testing":[35],"theories":[37],"narrative.":[39],"This":[40,63],"paper":[41,148],"proposes":[42],"an":[43],"automated":[44],"method":[45,64,123],"alignment":[48],"large":[50],"textual":[51],"using":[53],"techniques":[54],"from":[55,159],"natural":[56],"language":[57],"processing":[58],"similarity-based":[60],"image":[61,89],"segmentation.":[62],"proceeds":[65],"by":[66],"segmenting":[67],"each":[68],"document":[69,157],"into":[70],"series":[72],"constructs":[75],"sequences":[76,86],"abstracted":[78],"representations":[79],"compares":[83],"pairs":[84],"generate":[88],"matrices,":[90],"segments":[91,96],"the":[92,106,111,154,161],"images,":[93],"identifies":[94],"discover":[98],"commonly":[99],"occurring":[100],"units,":[102],"and,":[103],"finally,":[104],"returns":[105],"source":[107],"sentences":[108],"make":[110],"clusters":[112],"similarity":[115],"readable.":[116],"Preliminary":[117],"tests":[118],"elements":[120],"this":[122,146],"were":[124],"conducted":[125],"on":[126],"small":[128],"heterogeneous":[129,137],"corpus":[130,138,158,163],"(<;":[131],"100":[132],"documents)":[133],"moderate":[136,162],"(10k":[139],"documents).":[140],"Further":[141],"implementation":[142],"as":[143],"described":[144],"in":[145],"position":[147],"is":[149],"necessary":[150],"scale":[152],"full":[155],"251k":[156],"which":[160],"was":[164],"drawn.":[165]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
