{"id":"https://openalex.org/W2049929449","doi":"https://doi.org/10.1145/2484028.2484139","title":"Building a web test collection using social media","display_name":"Building a web test collection using social media","publication_year":2013,"publication_date":"2013-07-28","ids":{"openalex":"https://openalex.org/W2049929449","doi":"https://doi.org/10.1145/2484028.2484139","mag":"2049929449"},"language":"en","primary_location":{"id":"doi:10.1145/2484028.2484139","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2484028.2484139","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 36th international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101614562","display_name":"Chia-Jung Lee","orcid":"https://orcid.org/0000-0001-6451-9344"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Chia-Jung Lee","raw_affiliation_strings":["University of Massachusetts Amherst, Amherst, MA, USA","University Of Massachusetts Amherst, Amherst, MA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University Of Massachusetts Amherst, Amherst, MA, USA#TAB#","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5105659698","display_name":"W. Bruce Croft","orcid":"https://orcid.org/0000-0003-2391-9629"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"W. Bruce Croft","raw_affiliation_strings":["University of Massachusetts Amherst, Amherst, MA, USA","University Of Massachusetts Amherst, Amherst, MA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University Of Massachusetts Amherst, Amherst, MA, USA#TAB#","institution_ids":["https://openalex.org/I24603500"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101614562"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":null,"apc_paid":null,"fwci":0.8356,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.82963983,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"757","last_page":"760"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8044110536575317},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7467088103294373},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.6506320238113403},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6050736904144287},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.593769371509552},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.5304286479949951},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.5262126922607422},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.501431941986084},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.4676639139652252},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.4151192903518677}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8044110536575317},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7467088103294373},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.6506320238113403},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6050736904144287},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.593769371509552},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5304286479949951},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5262126922607422},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.501431941986084},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.4676639139652252},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.4151192903518677},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2484028.2484139","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2484028.2484139","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 36th international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.366.9304","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.366.9304","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://maroo.cs.umass.edu/pub/web/getpdf.php?id=1108","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5899999737739563,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1507150160","https://openalex.org/W1685426458","https://openalex.org/W2000246295","https://openalex.org/W2021856948","https://openalex.org/W2053100920","https://openalex.org/W2070740689","https://openalex.org/W2107370612","https://openalex.org/W2109244020","https://openalex.org/W2124504084","https://openalex.org/W2169213601","https://openalex.org/W4246858749"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2085384747","https://openalex.org/W2088166309","https://openalex.org/W1891216533","https://openalex.org/W4312133475","https://openalex.org/W4238976562","https://openalex.org/W2276587472","https://openalex.org/W2615795876","https://openalex.org/W2049612369","https://openalex.org/W2770872919"],"abstract_inverted_index":{"Community":[0],"Question":[1],"Answering":[2],"(CQA)":[3],"platforms":[4],"contain":[5],"a":[6,30,35],"large":[7,138],"number":[8,139],"of":[9,20,33,49,129,140],"questions":[10,63],"and":[11,66],"associated":[12,68],"answers.":[13],"Answerers":[14],"sometimes":[15],"include":[16],"URLs":[17],"as":[18,64,72],"part":[19],"the":[21,43,57,67,103,111,120,127,137,148],"answers":[22,87],"to":[23,55,90],"provide":[24],"further":[25],"information.":[26],"This":[27],"paper":[28],"describes":[29],"novel":[31],"way":[32],"building":[34],"test":[36,58,131],"collection":[37,59,100],"for":[38,147],"web":[39,70],"search":[40],"by":[41,60],"exploiting":[42],"link":[44],"information":[45],"from":[46],"this":[47,77,99,144],"type":[48],"social":[50],"media":[51],"data.":[52],"We":[53],"propose":[54],"build":[56],"regarding":[61],"CQA":[62,84],"queries":[65,141],"linked":[69],"pages":[71],"relevant":[73],"documents.":[74],"To":[75],"evaluate":[76],"approach,":[78],"we":[79],"collect":[80],"approximately":[81],"ten":[82],"thousand":[83],"queries,":[85],"whose":[86],"contained":[88],"links":[89],"ClueWeb09":[91],"documents":[92],"after":[93],"spam":[94],"filtering.":[95],"Experimental":[96],"results":[97],"using":[98],"show":[101],"that":[102,118,136],"relative":[104],"effectiveness":[105],"between":[106],"different":[107],"retrieval":[108],"models":[109],"on":[110,119],"ClueWeb-CQA":[112],"query":[113,124],"set":[114],"is":[115],"consistent":[116],"with":[117],"TREC":[121],"Web":[122],"Track":[123],"sets,":[125],"confirming":[126],"reliability":[128],"our":[130],"collection.":[132],"Further":[133],"analysis":[134],"shows":[135],"generated":[142],"through":[143],"approach":[145],"compensates":[146],"sparse":[149],"relevance":[150],"judgments":[151],"in":[152],"determining":[153],"significant":[154],"differences.":[155]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
