{"id":"https://openalex.org/W7128772917","doi":"https://doi.org/10.48550/arxiv.2602.11938","title":"Who is the richest club in the championship? Detecting and Rewriting Underspecified Questions Improve QA Performance","display_name":"Who is the richest club in the championship? Detecting and Rewriting Underspecified Questions Improve QA Performance","publication_year":2026,"publication_date":"2026-02-12","ids":{"openalex":"https://openalex.org/W7128772917","doi":"https://doi.org/10.48550/arxiv.2602.11938"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.11938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018135944","display_name":"Yan\u2010Hua Huang","orcid":"https://orcid.org/0000-0001-8505-1621"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Huang, Yunchong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086285176","display_name":"Gianni Barlacchi","orcid":"https://orcid.org/0000-0002-9896-0610"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barlacchi, Gianni","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125992154","display_name":"Sandro Pezzelle","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pezzelle, Sandro","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5018135944"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2996000051498413,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2996000051498413,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.12139999866485596,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.10080000013113022,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/underspecification","display_name":"Underspecification","score":0.9124000072479248},{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.6176999807357788},{"id":"https://openalex.org/keywords/clarity","display_name":"CLARITY","score":0.4957999885082245},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.45329999923706055},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.3959999978542328}],"concepts":[{"id":"https://openalex.org/C2779631151","wikidata":"https://www.wikidata.org/wiki/Q7883767","display_name":"Underspecification","level":2,"score":0.9124000072479248},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7412999868392944},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.6176999807357788},{"id":"https://openalex.org/C2777146004","wikidata":"https://www.wikidata.org/wiki/Q14949826","display_name":"CLARITY","level":2,"score":0.4957999885082245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4925999939441681},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.45329999923706055},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4336000084877014},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.3959999978542328},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3682999908924103},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.29120001196861267},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2890999913215637},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.26600000262260437}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.11938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.11938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.11938","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"perform":[4,76],"well":[5],"on":[6,79],"well-posed":[7],"questions,":[8],"yet":[9],"standard":[10],"question-answering":[11],"(QA)":[12],"benchmarks":[13],"remain":[14],"far":[15],"from":[16,125],"solved.":[17],"We":[18],"argue":[19],"that":[20,63,74,93,119],"this":[21,42,116],"gap":[22],"is":[23],"partly":[24],"due":[25],"to":[26,49,56,65,147],"underspecified":[27,51,72,100],"questions":[28,52,70,101],"-":[29],"queries":[30],"whose":[31],"interpretation":[32],"cannot":[33],"be":[34],"uniquely":[35],"determined":[36],"without":[37],"additional":[38],"context.":[39],"To":[40,81],"test":[41],"hypothesis,":[43],"we":[44,87],"introduce":[45],"an":[46,96,137],"LLM-based":[47],"classifier":[48],"identify":[50],"and":[53,73,143],"apply":[54],"it":[55],"several":[57],"widely":[58],"used":[59],"QA":[60,111,122,141],"datasets,":[61],"finding":[62],"16%":[64],"over":[66],"50%":[67],"of":[68,85],"benchmark":[69,151],"are":[71],"LLMs":[75],"significantly":[77],"worse":[78],"them.":[80],"isolate":[82],"the":[83],"effect":[84],"underspecification,":[86],"conduct":[88],"a":[89],"controlled":[90],"rewriting":[91,99],"experiment":[92],"serves":[94],"as":[95,136],"upper-bound":[97],"analysis,":[98],"into":[102],"fully":[103],"specified":[104],"variants":[105],"while":[106],"holding":[107],"gold":[108],"answers":[109],"fixed.":[110],"performance":[112],"consistently":[113],"improves":[114],"under":[115],"setting,":[117],"indicating":[118],"many":[120],"apparent":[121],"failures":[123],"stem":[124],"question":[126,148],"underspecification":[127,135],"rather":[128],"than":[129],"model":[130],"limitations.":[131],"Our":[132],"findings":[133],"highlight":[134],"important":[138],"confound":[139],"in":[140,150],"evaluation":[142],"motivate":[144],"greater":[145],"attention":[146],"clarity":[149],"design.":[152]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-14T00:00:00"}
