{"id":"https://openalex.org/W4243754476","doi":"https://doi.org/10.1109/jcdl.2014.6970166","title":"Detecting and modeling local text reuse","display_name":"Detecting and modeling local text reuse","publication_year":2014,"publication_date":"2014-09-01","ids":{"openalex":"https://openalex.org/W4243754476","doi":"https://doi.org/10.1109/jcdl.2014.6970166"},"language":"en","primary_location":{"id":"doi:10.1109/jcdl.2014.6970166","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jcdl.2014.6970166","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Joint Conference on Digital Libraries","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101722493","display_name":"David A. Smith","orcid":"https://orcid.org/0000-0002-6636-6940"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"David A. Smith","raw_affiliation_strings":["College of Computer and Information Science, Northeastern University Boston, MA, U.S.A"],"affiliations":[{"raw_affiliation_string":"College of Computer and Information Science, Northeastern University Boston, MA, U.S.A","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005843752","display_name":"Ryan Cordel","orcid":null},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Cordel","raw_affiliation_strings":["Northeastern University, Boston, MA, US"],"affiliations":[{"raw_affiliation_string":"Northeastern University, Boston, MA, US","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008400357","display_name":"Elizabeth Maddock Dillon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elizabeth Maddock Dillon","raw_affiliation_strings":["English Department, Northeastern University Boston, MA, U.S.A"],"affiliations":[{"raw_affiliation_string":"English Department, Northeastern University Boston, MA, U.S.A","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021325471","display_name":"Nick Stramp","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nick Stramp","raw_affiliation_strings":["Political Science Department, University of Washington Seattle, WA, U.S.A"],"affiliations":[{"raw_affiliation_string":"Political Science Department, University of Washington Seattle, WA, U.S.A","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112036981","display_name":"John Wilkerson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"John Wilkerson","raw_affiliation_strings":["Political Science Department, University of Washington Seattle, WA, U.S.A"],"affiliations":[{"raw_affiliation_string":"Political Science Department, University of Washington Seattle, WA, U.S.A","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101722493"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7071,"has_fulltext":false,"cited_by_count":44,"citation_normalized_percentile":{"value":0.88296141,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"183","last_page":"192"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9731000065803528,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.8738851547241211},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7422380447387695},{"id":"https://openalex.org/keywords/legislation","display_name":"Legislation","score":0.7301444411277771},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3742143511772156},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.354996919631958},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3396620452404022},{"id":"https://openalex.org/keywords/law","display_name":"Law","score":0.1328044831752777},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.1286156177520752},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09741133451461792}],"concepts":[{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.8738851547241211},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7422380447387695},{"id":"https://openalex.org/C2777351106","wikidata":"https://www.wikidata.org/wiki/Q49371","display_name":"Legislation","level":2,"score":0.7301444411277771},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3742143511772156},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.354996919631958},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3396620452404022},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.1328044831752777},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.1286156177520752},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09741133451461792},{"id":"https://openalex.org/C548081761","wikidata":"https://www.wikidata.org/wiki/Q180388","display_name":"Waste management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jcdl.2014.6970166","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jcdl.2014.6970166","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Joint Conference on Digital Libraries","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W938539187","https://openalex.org/W1492995868","https://openalex.org/W1951628766","https://openalex.org/W1972174622","https://openalex.org/W1986022261","https://openalex.org/W2009904773","https://openalex.org/W2053107662","https://openalex.org/W2067272131","https://openalex.org/W2076489648","https://openalex.org/W2085922539","https://openalex.org/W2090320977","https://openalex.org/W2127492100","https://openalex.org/W2129070169","https://openalex.org/W2132399973","https://openalex.org/W2148578434","https://openalex.org/W2166036954","https://openalex.org/W2171150534","https://openalex.org/W4294541781","https://openalex.org/W6674629281","https://openalex.org/W7006202893"],"related_works":["https://openalex.org/W2380896940","https://openalex.org/W2372275786","https://openalex.org/W4317411830","https://openalex.org/W2360757248","https://openalex.org/W2391297446","https://openalex.org/W2049182572","https://openalex.org/W2374527051","https://openalex.org/W2495499255","https://openalex.org/W2351532294","https://openalex.org/W2387901866"],"abstract_inverted_index":{"Texts":[0],"propagate":[1],"through":[2],"many":[3],"social":[4],"networks":[5],"and":[6,14,50,79,97],"provide":[7],"evidence":[8],"for":[9,18],"their":[10],"structure.":[11],"We":[12,31],"describe":[13],"evaluate":[15,67],"efficient":[16],"algorithms":[17],"detecting":[19],"clusters":[20],"of":[21,42,53,71,82],"reused":[22],"passages":[23],"embedded":[24],"within":[25],"longer":[26],"documents":[27],"in":[28,45,57],"large":[29],"collections.":[30],"apply":[32],"these":[33,62],"techniques":[34,86],"to":[35,89],"two":[36],"case":[37,64],"studies:":[38],"analyzing":[39],"the":[40,46,51,58,69,72,80,83],"culture":[41],"free":[43],"reprinting":[44],"nineteenth-century":[47],"United":[48],"States":[49],"development":[52],"bills":[54],"into":[55],"legislation":[56],"U.S.":[59],"Congress.":[60],"Using":[61],"divergent":[63],"studies,":[65],"we":[66],"both":[68],"efficiency":[70],"approximate":[73],"local":[74],"text":[75],"reuse":[76],"detection":[77],"methods":[78],"accuracy":[81],"results.":[84],"These":[85],"allow":[87],"us":[88],"explore":[90],"how":[91],"ideas":[92,95],"spread,":[93,96],"which":[94,98],"subgroups":[99],"shared":[100],"ideas.":[101]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":19},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":5},{"year":2015,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
