{"id":"https://openalex.org/W4412377072","doi":"https://doi.org/10.1145/3726302.3730275","title":"Researchy Questions: A Dataset of Multi-Perspective, Decompositional Questions for Deep Research","display_name":"Researchy Questions: A Dataset of Multi-Perspective, Decompositional Questions for Deep Research","publication_year":2025,"publication_date":"2025-07-13","ids":{"openalex":"https://openalex.org/W4412377072","doi":"https://doi.org/10.1145/3726302.3730275"},"language":"en","primary_location":{"id":"doi:10.1145/3726302.3730275","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730275","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730275","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730275","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026219235","display_name":"Corby Rosset","orcid":"https://orcid.org/0000-0001-9167-6214"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Corbin Rosset","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022914972","display_name":"Hyunsong Chung","orcid":"https://orcid.org/0000-0002-2490-4712"},"institutions":[{"id":"https://openalex.org/I16733864","display_name":"National Taiwan University","ror":"https://ror.org/05bqach95","country_code":"TW","type":"education","lineage":["https://openalex.org/I16733864"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Ho-Lam Chung","raw_affiliation_strings":["National Taiwan University, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Taiwan University, Taipei, Taiwan","institution_ids":["https://openalex.org/I16733864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010680967","display_name":"Guanghui Qin","orcid":"https://orcid.org/0000-0002-3009-8614"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guanghui Qin","raw_affiliation_strings":["Johns Hopkins University, Baltimore, MD, USA"],"affiliations":[{"raw_affiliation_string":"Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089943934","display_name":"Ethan C. Chau","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ethan Chau","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111483945","display_name":"Zhuo Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhuo Feng","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021000040","display_name":"Ahmed Hassan Awadallah","orcid":"https://orcid.org/0000-0001-6426-3537"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ahmed Awadallah","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jennifer Neville","orcid":"https://orcid.org/0009-0007-1157-018X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jennifer Neville","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081428282","display_name":"Nikhil Rao","orcid":"https://orcid.org/0000-0003-0281-932X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nikhil Rao","raw_affiliation_strings":["Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5026219235"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":4.8506,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.94894562,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3712","last_page":"3722"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9596999883651733,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9510999917984009,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.7888004779815674},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6115527749061584},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4864034950733185},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4615137577056885},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3494557738304138}],"concepts":[{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.7888004779815674},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6115527749061584},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4864034950733185},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4615137577056885},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3494557738304138}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3726302.3730275","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730275","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730275","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3726302.3730275","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730275","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730275","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"id":"https://metadata.un.org/sdg/13","display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412377072.pdf","grobid_xml":"https://content.openalex.org/works/W4412377072.grobid-xml"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W2069049590","https://openalex.org/W2116938310","https://openalex.org/W2124063543","https://openalex.org/W2196221440","https://openalex.org/W2252136820","https://openalex.org/W2950681488","https://openalex.org/W2998702515","https://openalex.org/W3099700870","https://openalex.org/W3101082165","https://openalex.org/W3156789018","https://openalex.org/W3169841173","https://openalex.org/W3171446839","https://openalex.org/W3197149826","https://openalex.org/W4284689799","https://openalex.org/W4284691825","https://openalex.org/W4385569757","https://openalex.org/W4385571271","https://openalex.org/W4385572079","https://openalex.org/W4389520103","https://openalex.org/W4389520468","https://openalex.org/W4408666882"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2018871932","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Existing":[0],"question":[1],"answering":[2,174,183],"(QA)":[3],"datasets":[4],"are":[5,91],"no":[6],"longer":[7],"challenging":[8],"to":[9,40,43,117,143],"most":[10,88],"powerful":[11],"Large":[12],"Language":[13],"Models":[14],"(LLMs).":[15],"Traditional":[16],"QA":[17],"benchmarks":[18],"like":[19,97,163,176],"TriviaQA,":[20],"NaturalQuestions,":[21],"ELI5":[22],"and":[23,38,129,147,165],"HotpotQA":[24],"mainly":[25],"study":[26],"''known":[27],"unknowns''":[28],"with":[29,193,199],"clear":[30],"indications":[31],"of":[32,51,58,66,115,133,161],"both":[33],"what":[34],"information":[35,68],"is":[36,55,85],"missing,":[37],"how":[39],"find":[41,77],"it":[42],"answer":[44],"the":[45,52,125],"question.":[46,212],"A":[47],"yet":[48],"unmet":[49],"need":[50],"NLP":[53],"community":[54],"a":[56,63,101,194],"bank":[57],"non-factoid,":[59,145],"multi-perspective":[60],"questions":[61,79,136,158],"involving":[62],"great":[64],"deal":[65],"unclear":[67],"needs,":[69],"i.e.":[70],"''unknown":[71],"unknowns''.":[72],"We":[73,121,149,168,185],"claim":[74],"we":[75],"can":[76],"such":[78,111],"in":[80,159],"search":[81,140],"engine":[82,141],"logs,":[83],"which":[84],"surprising":[86],"because":[87],"question-intent":[89],"queries":[90],"indeed":[92],"factoid.":[93],"Furthermore,":[94],"recent":[95],"products":[96],"Google's":[98],"DeepResearch":[99],"(announced":[100],"year":[102],"after":[103],"this":[104],"resource":[105],"was":[106],"released":[107],"publicly)":[108],"specifically":[109],"address":[110],"queries,":[112],"retrieving":[113],"hundreds":[114],"documents":[116],"synthesize":[118],"report-style":[119],"responses.":[120],"present":[122],"Researchy":[123,191],"Questions,":[124],"world's":[126],"first,":[127],"only":[128],"largest":[130],"public":[131],"dataset":[132],"''Deep":[134],"Research''":[135],"filtered":[137],"from":[138],"real":[139],"logs":[142],"be":[144],"''decompositional''":[146],"multi-perspective.":[148],"show":[150,170],"that":[151,171,207],"users":[152],"spend":[153],"substantial":[154],"''effort''":[155],"on":[156,202],"these":[157],"terms":[160],"signals":[162],"clicks":[164],"session":[166],"length.":[167],"also":[169],"''slow":[172],"thinking''":[173],"techniques,":[175],"decomposition":[177],"into":[178],"sub-questions":[179],"shows":[180],"benefit":[181],"over":[182,203],"directly.":[184],"release":[186],"(at":[187],"https://huggingface.co/datasets/corbyrosset/researchy_questions)":[188],"about":[189],"100k":[190],"Questions":[192],"permissive":[195],"CDLA-2.0":[196],"license,":[197],"along":[198],"click":[200],"histograms":[201],"350k":[204],"Clueweb22":[205],"URLs":[206],"were":[208],"clicked":[209],"for":[210],"each":[211]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
