{"id":"https://openalex.org/W1992781401","doi":"https://doi.org/10.1145/2362724.2362773","title":"Towards realistic known-item topics for the ClueWeb","display_name":"Towards realistic known-item topics for the ClueWeb","publication_year":2012,"publication_date":"2012-08-21","ids":{"openalex":"https://openalex.org/W1992781401","doi":"https://doi.org/10.1145/2362724.2362773","mag":"1992781401"},"language":"en","primary_location":{"id":"doi:10.1145/2362724.2362773","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2362724.2362773","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th Information Interaction in Context Symposium","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084915697","display_name":"Claudia Hauff","orcid":"https://orcid.org/0000-0001-9879-6470"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Claudia Hauff","raw_affiliation_strings":["Delft University of Technology, Delft, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Delft University of Technology, Delft, The Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014322854","display_name":"Matthias Hagen","orcid":"https://orcid.org/0000-0002-9733-2890"},"institutions":[{"id":"https://openalex.org/I51441396","display_name":"Bauhaus-Universit\u00e4t Weimar","ror":"https://ror.org/033bb5z47","country_code":"DE","type":"education","lineage":["https://openalex.org/I51441396"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Hagen","raw_affiliation_strings":["Bauhaus-Universit\u00e4t Weimar, Weimar, Germany"],"affiliations":[{"raw_affiliation_string":"Bauhaus-Universit\u00e4t Weimar, Weimar, Germany","institution_ids":["https://openalex.org/I51441396"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004704820","display_name":"Anna Cornelia Beyer","orcid":null},"institutions":[{"id":"https://openalex.org/I51441396","display_name":"Bauhaus-Universit\u00e4t Weimar","ror":"https://ror.org/033bb5z47","country_code":"DE","type":"education","lineage":["https://openalex.org/I51441396"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Anna Beyer","raw_affiliation_strings":["Bauhaus-Universit\u00e4t Weimar, Weimar, Germany"],"affiliations":[{"raw_affiliation_string":"Bauhaus-Universit\u00e4t Weimar, Weimar, Germany","institution_ids":["https://openalex.org/I51441396"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027915931","display_name":"Benno Stein","orcid":"https://orcid.org/0000-0001-9033-2217"},"institutions":[{"id":"https://openalex.org/I51441396","display_name":"Bauhaus-Universit\u00e4t Weimar","ror":"https://ror.org/033bb5z47","country_code":"DE","type":"education","lineage":["https://openalex.org/I51441396"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Benno Stein","raw_affiliation_strings":["Bauhaus-Universit\u00e4t Weimar, Weimar, Germany"],"affiliations":[{"raw_affiliation_string":"Bauhaus-Universit\u00e4t Weimar, Weimar, Germany","institution_ids":["https://openalex.org/I51441396"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084915697"],"corresponding_institution_ids":["https://openalex.org/I98358874"],"apc_list":null,"apc_paid":null,"fwci":1.4771,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.87744249,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"274","last_page":"277"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9538000226020813,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.864511251449585},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7422925233840942},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.687743067741394},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.482837975025177},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3784950077533722},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.327218234539032}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.864511251449585},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7422925233840942},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.687743067741394},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.482837975025177},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3784950077533722},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.327218234539032},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2362724.2362773","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2362724.2362773","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th Information Interaction in Context Symposium","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.261.1840","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.261.1840","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.uni-weimar.de/medien/webis/publications/papers/stein_2012n.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W11620817","https://openalex.org/W91095625","https://openalex.org/W94637519","https://openalex.org/W1987003629","https://openalex.org/W1991332152","https://openalex.org/W2041583667","https://openalex.org/W2065132166","https://openalex.org/W2097127516","https://openalex.org/W2108566279","https://openalex.org/W2112175905","https://openalex.org/W2123365817","https://openalex.org/W2143131512","https://openalex.org/W2147770679","https://openalex.org/W2159665776","https://openalex.org/W4250633719","https://openalex.org/W6600477187","https://openalex.org/W6603899496"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2772917594","https://openalex.org/W4306742369","https://openalex.org/W2548721895","https://openalex.org/W4303457083","https://openalex.org/W2373456246","https://openalex.org/W4376623224","https://openalex.org/W2951359407","https://openalex.org/W2124566234","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Known-item":[0],"finding":[1,34],"is":[2],"the":[3,43,57,94],"task":[4],"of":[5,15,39],"re-finding":[6],"and":[7,42,53],"re-accessing":[8],"an":[9],"item":[10,96],"previously":[11],"seen.":[12],"Typical":[13],"examples":[14],"known":[16,45,95],"items":[17],"include":[18],"accessed":[19],"Web":[20,64],"sites,":[21],"received":[22],"emails,":[23],"or":[24,86],"documents":[25],"on":[26,32,37],"one's":[27],"personal":[28],"desktop.":[29],"Current":[30],"research":[31],"known-item":[33,40],"heavily":[35],"relies":[36],"corpora":[38,50,80,103],"queries":[41,85,87],"respective":[44],"items.":[46],"However,":[47],"many":[48],"existing":[49,77],"are":[51],"proprietary":[52],"not":[54,71],"available":[55,79],"to":[56,104],"public":[58,102],"(in":[59],"particular":[60],"those":[61],"derived":[62],"from":[63],"query":[65],"logs),":[66],"a":[67],"fact":[68],"which":[69],"does":[70],"allow":[72],"for":[73],"repeatable":[74],"research.":[75],"The":[76],"publicly":[78],"either":[81],"contain":[82],"automatically":[83],"generated":[84,91],"that":[88],"were":[89],"manually":[90],"while":[92],"seeing":[93],"itself.":[97],"Hence,":[98],"we":[99],"consider":[100],"these":[101],"be":[105],"rather":[106],"artificial":[107],"in":[108],"nature.":[109]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
