{"id":"https://openalex.org/W6911845125","doi":"https://doi.org/10.5281/zenodo.14748980","title":"Webis Crowd RAG Corpus 2025","display_name":"Webis Crowd RAG Corpus 2025","publication_year":2025,"publication_date":"2025-01-27","ids":{"openalex":"https://openalex.org/W6911845125","doi":"https://doi.org/10.5281/zenodo.14748980"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.14748980","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.14748980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.14748980","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Gienapp, Lukas","orcid":"https://orcid.org/0000-0001-5707-3751"},"institutions":[{"id":"https://openalex.org/I4401726909","display_name":"Center for Scalable Data Analytics and Artificial Intelligence","ror":"https://ror.org/01t4ttr56","country_code":"DE","type":"education","lineage":["https://openalex.org/I4401726909","https://openalex.org/I78650965","https://openalex.org/I926574661"]},{"id":"https://openalex.org/I926574661","display_name":"Leipzig University","ror":"https://ror.org/03s7gtk40","country_code":"DE","type":"education","lineage":["https://openalex.org/I926574661"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Gienapp, Lukas","raw_affiliation_strings":["Leipzig University","Center for Scalable Data Analytics and Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Leipzig University","institution_ids":["https://openalex.org/I926574661"]},{"raw_affiliation_string":"Center for Scalable Data Analytics and Artificial Intelligence","institution_ids":["https://openalex.org/I4401726909"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hagen, Tim","orcid":"https://orcid.org/0009-0000-4854-7249"},"institutions":[{"id":"https://openalex.org/I106157433","display_name":"University of Kassel","ror":"https://ror.org/04zc7p361","country_code":"DE","type":"education","lineage":["https://openalex.org/I106157433"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]}],"countries":["CA","DE"],"is_corresponding":false,"raw_author_name":"Hagen, Tim","raw_affiliation_strings":["University of Kassel","Hessian Center for Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"University of Kassel","institution_ids":["https://openalex.org/I106157433"]},{"raw_affiliation_string":"Hessian Center for Artificial Intelligence","institution_ids":["https://openalex.org/I4210164862"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fr\u00f6be, Maik","orcid":"https://orcid.org/0000-0002-1003-981X"},"institutions":[{"id":"https://openalex.org/I76198965","display_name":"Friedrich Schiller University Jena","ror":"https://ror.org/05qpz1x62","country_code":"DE","type":"education","lineage":["https://openalex.org/I76198965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Fr\u00f6be, Maik","raw_affiliation_strings":["Friedrich Schiller University Jena"],"affiliations":[{"raw_affiliation_string":"Friedrich Schiller University Jena","institution_ids":["https://openalex.org/I76198965"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hagen, Matthias","orcid":"https://orcid.org/0000-0002-9733-2890"},"institutions":[{"id":"https://openalex.org/I76198965","display_name":"Friedrich Schiller University Jena","ror":"https://ror.org/05qpz1x62","country_code":"DE","type":"education","lineage":["https://openalex.org/I76198965"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Hagen, Matthias","raw_affiliation_strings":["Friedrich Schiller University Jena"],"affiliations":[{"raw_affiliation_string":"Friedrich Schiller University Jena","institution_ids":["https://openalex.org/I76198965"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Stein, Benno","orcid":"https://orcid.org/0000-0001-9033-2217"},"institutions":[{"id":"https://openalex.org/I51441396","display_name":"Bauhaus-Universit\u00e4t Weimar","ror":"https://ror.org/033bb5z47","country_code":"DE","type":"education","lineage":["https://openalex.org/I51441396"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stein, Benno","raw_affiliation_strings":["Bauhaus-Universit\u00e4t Weimar"],"affiliations":[{"raw_affiliation_string":"Bauhaus-Universit\u00e4t Weimar","institution_ids":["https://openalex.org/I51441396"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Potthast, Martin","orcid":"https://orcid.org/0000-0003-2451-0665"},"institutions":[{"id":"https://openalex.org/I106157433","display_name":"University of Kassel","ror":"https://ror.org/04zc7p361","country_code":"DE","type":"education","lineage":["https://openalex.org/I106157433"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]},{"id":"https://openalex.org/I4401726909","display_name":"Center for Scalable Data Analytics and Artificial Intelligence","ror":"https://ror.org/01t4ttr56","country_code":"DE","type":"education","lineage":["https://openalex.org/I4401726909","https://openalex.org/I78650965","https://openalex.org/I926574661"]}],"countries":["CA","DE"],"is_corresponding":false,"raw_author_name":"Potthast, Martin","raw_affiliation_strings":["University of Kassel","Center for Scalable Data Analytics and Artificial Intelligence","Hessian Center for Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"University of Kassel","institution_ids":["https://openalex.org/I106157433"]},{"raw_affiliation_string":"Center for Scalable Data Analytics and Artificial Intelligence","institution_ids":["https://openalex.org/I4401726909"]},{"raw_affiliation_string":"Hessian Center for Artificial Intelligence","institution_ids":["https://openalex.org/I4210164862"]}]},{"author_position":"last","author":{"id":null,"display_name":"Scells, Harrisen","orcid":"https://orcid.org/0000-0001-9578-7157"},"institutions":[{"id":"https://openalex.org/I106157433","display_name":"University of Kassel","ror":"https://ror.org/04zc7p361","country_code":"DE","type":"education","lineage":["https://openalex.org/I106157433"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]}],"countries":["CA","DE"],"is_corresponding":false,"raw_author_name":"Scells, Harrisen","raw_affiliation_strings":["University of Kassel","Hessian Center for Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"University of Kassel","institution_ids":["https://openalex.org/I106157433"]},{"raw_affiliation_string":"Hessian Center for Artificial Intelligence","institution_ids":["https://openalex.org/I4210164862"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4401726909","https://openalex.org/I926574661"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.7670999765396118},{"id":"https://openalex.org/keywords/string-metric","display_name":"String metric","score":0.5812000036239624},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5810999870300293},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.41819998621940613},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.4088999927043915},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.40139999985694885}],"concepts":[{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.7670999765396118},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6985999941825867},{"id":"https://openalex.org/C22820288","wikidata":"https://www.wikidata.org/wiki/Q9050568","display_name":"String metric","level":4,"score":0.5812000036239624},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5810999870300293},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48539999127388},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4138000011444092},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.40139999985694885},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.36500000953674316},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3637000024318695},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.35830000042915344},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.3253999948501587},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.32350000739097595},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.3222000002861023},{"id":"https://openalex.org/C13622073","wikidata":"https://www.wikidata.org/wiki/Q2243831","display_name":"Writing style","level":2,"score":0.27639999985694885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.14748980","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.14748980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.14748980","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.14748980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Data":[0],"Documentation":[1],"responses.jsonl.gz":[2],"RAG":[3,89,108,129,238,478],"responses":[4,373],"of":[5,26,38,49,59,78,85,95,110,116,131,177,216,244,260,276,286,304,329,340,362,382,456,484,500,573,584,606,628,650,672,694,716],"about":[6],"250":[7],"words":[8],"written":[9,52,68,138],"by":[10,69,139,152,187,296,427,531,550],"human":[11,74,141],"writers":[12],"and":[13,335],"LLMs":[14],"in":[15,248,264,488,504],"different":[16],"response":[17,23,28,51,183,220,233,247,263,351,393,423,460,473,487,503,570],"styles.":[18],"Key":[19,209,449,566],"Description":[20,210,450,567],"Source":[21,211,451,568],"Values":[22],"The":[24,35,46,82,93,114,135,190,214,229,242,258,274,289,313,338,360,380,402,430,454,469,482,498,514,528,571,580,602,624,646,668,690,712],"UUID":[25,33,215,227,243,256,259,272,287,455,467,483,496,499,512,572,578],"the":[27,50,96,117,140,170,217,245,261,277,293,297,322,341,347,363,369,383,389,409,457,485,501,517,532,574],"/":[29],"task.":[30,40,55],"Task":[31,41,56,75,225,254,270,283,465,494,510,522,576],"Specification":[32,42,57,76,226,255,271,284,466,495,511,523,577],"topic":[34,36,230,470,564,595,617,639,661,683,705,727],"ID":[37,44,240,480],"this":[39,54,65,86,101,122,219,232,249,265,281,459,472,489,505,535,585,607,629,651,673,695,717],"String":[43,90,111,132,147,161,239,479],"style":[45,48],"text":[47,66,84,134,136],"for":[53,100,121,198,292,321,346,368,388,408,438,534],"One":[58,77],"essay,":[60],"news,":[61],"bullet":[62],"kind":[63],"Whether":[64],"was":[67,222,462],"an":[70,428],"LLM":[71,533,537],"or":[72,143,310,417,525,541],"a":[73,345,551],"human,":[79],"llm":[80],"query":[81,83],"topic.":[87],"TREC":[88,107,128,237,477],"value":[91],"references_ids":[92,127,172],"IDs":[94,112],"20":[97,118],"sources":[98,119],"retrieved":[99,120],"topics'":[102,123],"query.":[103,124],"Aligned":[104,125],"with":[105,126,169,318,405],"references_texts":[106,113],"List":[109,130,176,285,303,328],"texts":[115],"values":[133,561],"as":[137,150,185,425,548,559],"author":[142],"LLM.":[144,429],"Writing":[145,159,174],"Survey":[146,160,175],"cleaned_text":[148],"Text":[149,163],"cleaned":[151],"our":[153],"preprocessing":[154],"pipeline,":[155],"without":[156],"reference":[157],"markers.":[158],"statements":[162],"parsed":[164],"into":[165],"individual":[166,290,314,526],"statements,":[167],"each":[168,199,306,319,331,439],"corresponding":[171],"cited.":[173],"Dictionaries":[178],"ratings.jsonl.gz":[179],"Ratings":[180,420],"on":[181,421],"pairwise":[182,422],"utility":[184,424],"given":[186,426,530],"crowd":[188],"workers.":[189,299],"columns":[191,431],"prefixed":[192,432],"{dimension}":[193,433,527],"below":[194,434],"are":[195,435],"included":[196,436],"once":[197,437],"possible":[200,440],"dimension":[201,295,349,371,391,441],"(correctness_topical,":[202,442],"coherence_logical,":[203,443],"coherence_stylistic,":[204,444],"coverage_broad,":[205,445],"coverage_deep,":[206,446],"consistency_internal,":[207,447],"quality_overall).":[208,448],"Value":[212,452,569],"submission_id":[213,453],"questionnaire":[218,458],"pair":[221,234,250,266,461,474,490,506],"rated":[223,463],"by.":[224,464],"query_id":[228,468],"id":[231,471],"belongs":[235,475],"to.":[236,476],"response_a":[241,481],"first":[246,486],"(displayed":[251,267,491,507],"lefthand":[252,492],"side).":[253,269,493,509],"response_b":[257,497],"second":[262,502],"righthand":[268,508],"worker":[273],"UUIDs":[275],"5":[278,298],"workers":[279],"completing":[280],"questionnaire.":[282],"{dimension}_vote":[288],"votes":[291],"specified":[294,323,348,370,390,410],"Prolific":[300,325,355,375,397,412],"Crowd":[301,326,356,376,398,413],"Workers":[302,327,357,377,399,414],"string,":[305],"entry":[307,332],"a,":[308,415,539],"n,":[309,416,540],"b":[311,387,418,542],"{dimension}_spam_probability":[312],"spam":[315],"probabilities":[316],"associated":[317],"vote":[320],"dimension.":[324,411],"float,":[330],"between":[333],"0":[334],"1":[336],"{dimension}_p_a":[337],"probability":[339,361,381,407],"gold":[342,364,384,403],"label":[343,365,385,404],"being":[344,366,386],"(first":[350],"better":[352,394],"than":[353,395],"second).":[354],"float":[358,378,400],"{dimension}_p_n":[359],"n":[367],"(both":[372],"equal).":[374],"{dimension}_p_b":[379],"(second":[392],"first).":[396],"{dimension}_gold":[401],"highest":[406],"llm_ratings.jsonl.gz":[419],"inference":[513,515],"mode":[516],"judgments":[518],"were":[519],"collected":[520],"with.":[521],"combined,":[524],"rating":[529],"{dimension}.":[536],"Inference":[538,588,610,632,654,676,698,720],"grades.jsonl.gz":[543],"Pointwise,":[544],"per-topic":[545],"ranked":[546],"grades":[547],"inferred":[549],"Bradley-Terry":[552,590,612,634,656,678,700,722],"probabilistic":[553],"model.":[554],"Not":[555],"to":[556],"be":[557],"used":[558],"absolute":[560],"across":[562],"their":[563],"context!":[565],"response.":[575,586,608,630,652,674,696,718],"correctness_topical":[579],"topical":[581],"correctness":[582],"grade":[583,605,627,649,671,693,715],"Pairwise":[587,609,631,653,675,697,719],"w.":[589,611,633,655,677,699,721],"Model":[591,613,635,657,679,701,723],"Integer,":[592,614,636,658,680,702,724],"1-6,":[593,615,637,659,681,703,725],"per":[594,616,638,660,682,704,726],"relative":[596,618,640,662,684,706,728],"ranks,":[597,619,641,663,685,707,729],"higher":[598,620,642,664,686,708,730],"is":[599,621,643,665,687,709,731],"better.":[600,622,644,666,688,710,732],"coherence_logical":[601],"logical":[603],"coherence":[604,626],"coherence_stylistic":[623],"stylistic":[625],"coverage_broad":[645],"broad":[647],"coverage":[648,670],"coverage_deep":[667],"deep":[669],"consistency_internal":[689],"internal":[691],"consistency":[692],"quality_overall":[711],"overall":[713],"quality":[714]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
