{"id":"https://openalex.org/W2141233457","doi":"https://doi.org/10.1145/1321440.1321473","title":"Discovering interesting usage patterns in text collections","display_name":"Discovering interesting usage patterns in text collections","publication_year":2007,"publication_date":"2007-11-06","ids":{"openalex":"https://openalex.org/W2141233457","doi":"https://doi.org/10.1145/1321440.1321473","mag":"2141233457"},"language":"en","primary_location":{"id":"doi:10.1145/1321440.1321473","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1321440.1321473","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the sixteenth ACM conference on Conference on information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109498555","display_name":"Anthony Don","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anthony Don","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071079350","display_name":"Elena Zheleva","orcid":"https://orcid.org/0000-0001-7662-2568"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Elena Zheleva","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052371711","display_name":"Machon Gregory","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Machon Gregory","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005999401","display_name":"Sureyya Tarkan","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sureyya Tarkan","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020556428","display_name":"Loretta Auvil","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]},{"id":"https://openalex.org/I2801919071","display_name":"University of Illinois System","ror":"https://ror.org/05e94g991","country_code":"US","type":"education","lineage":["https://openalex.org/I2801919071"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Loretta Auvil","raw_affiliation_strings":["University of Illinois, Urbana, IL","[University of Illinois, Urbana, IL]"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Illinois, Urbana, IL","institution_ids":["https://openalex.org/I2801919071"]},{"raw_affiliation_string":"[University of Illinois, Urbana, IL]","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087287236","display_name":"Tanya Clement","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tanya Clement","raw_affiliation_strings":["University of Maryland, College Park"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052623072","display_name":"Ben Shneiderman","orcid":"https://orcid.org/0000-0002-8298-1097"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ben Shneiderman","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030084361","display_name":"Catherine Plaisant","orcid":"https://orcid.org/0000-0003-4049-5848"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Catherine Plaisant","raw_affiliation_strings":["University of Maryland, College Park, MD"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":19.8978,"has_fulltext":false,"cited_by_count":106,"citation_normalized_percentile":{"value":0.99112328,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"213","last_page":"222"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.967199981212616,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7711528539657593},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.5654433369636536},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5118147730827332},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.5021202564239502},{"id":"https://openalex.org/keywords/repetition","display_name":"Repetition (rhetorical device)","score":0.4564518928527832},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.39493614435195923},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09430250525474548}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7711528539657593},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.5654433369636536},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5118147730827332},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.5021202564239502},{"id":"https://openalex.org/C2776141515","wikidata":"https://www.wikidata.org/wiki/Q1274479","display_name":"Repetition (rhetorical device)","level":2,"score":0.4564518928527832},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.39493614435195923},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09430250525474548},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1321440.1321473","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1321440.1321473","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the sixteenth ACM conference on Conference on information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8799999952316284,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W110175884","https://openalex.org/W1484413656","https://openalex.org/W1489673536","https://openalex.org/W1506285740","https://openalex.org/W1594453896","https://openalex.org/W1974930421","https://openalex.org/W2079533881","https://openalex.org/W2094783359","https://openalex.org/W2101284865","https://openalex.org/W2116628377","https://openalex.org/W2119307930","https://openalex.org/W2141018272","https://openalex.org/W2150231504","https://openalex.org/W2167983404","https://openalex.org/W2797816625","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2931688134","https://openalex.org/W2377919138","https://openalex.org/W2378857091","https://openalex.org/W2999756192","https://openalex.org/W103652678","https://openalex.org/W4226090359","https://openalex.org/W2059697060","https://openalex.org/W936373746","https://openalex.org/W2975817033"],"abstract_inverted_index":{"This":[0,90],"paper":[1],"addresses":[2],"the":[3,25,62,70,88,96],"problem":[4],"of":[5,27,40,57,64,77,99,108],"making":[6],"text":[7,28,35,48,78,109,119,143],"mining":[8],"results":[9],"more":[10],"comprehensible":[11],"to":[12,23,45,94,116],"humanities":[13],"scholars,":[14],"journalists,":[15],"intelligence":[16],"analysts,":[17],"and":[18,42,84,132,138],"other":[19,118],"researchers,":[20],"in":[21,69,87],"order":[22],"support":[24],"analysis":[26],"collections.":[29,144],"Our":[30],"system,":[31],"FeatureLens1,":[32],"visualizes":[33],"a":[34,129],"collection":[36],"at":[37],"several":[38],"levels":[39],"granularity":[41],"enables":[43],"users":[44,93,134],"explore":[46,117],"interesting":[47,139],"patterns.":[49,110],"The":[50,111],"current":[51],"implementation":[52],"focuses":[53],"on":[54],"frequent":[55],"itemsets":[56],"n-grams,":[58],"as":[59,102,121],"they":[60],"capture":[61],"repetition":[63],"exact":[65],"or":[66,105],"similar":[67],"expressions":[68],"collection.":[71,89],"Users":[72],"can":[73],"find":[74],"meaningful":[75],"co-occurrences":[76],"patterns":[79],"by":[80],"visualizing":[81],"them":[82],"within":[83],"across":[85],"documents":[86],"also":[91],"permits":[92],"identify":[95],"temporal":[97],"evolution":[98],"usage":[100],"such":[101],"increasing,":[103],"decreasing":[104],"sudden":[106],"appearance":[107],"interface":[112],"could":[113],"be":[114],"used":[115],"features":[120],"well.":[122],"Initial":[123],"studies":[124],"suggest":[125],"that":[126],"FeatureLens":[127],"helped":[128],"literary":[130],"scholar":[131],"8":[133],"generate":[135],"new":[136],"hypotheses":[137],"insights":[140],"using":[141],"2":[142]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":2},{"year":2018,"cited_by_count":7},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":19},{"year":2012,"cited_by_count":9}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
