{"id":"https://openalex.org/W7138917939","doi":"https://doi.org/10.48550/arxiv.2603.15723","title":"Context-Length Robustness in Question Answering Models: A Comparative Empirical Study","display_name":"Context-Length Robustness in Question Answering Models: A Comparative Empirical Study","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138917939","doi":"https://doi.org/10.48550/arxiv.2603.15723"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15723","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15723","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15723","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126670493","display_name":"Trishita Dhara","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dhara, Trishita","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5047845479","display_name":"Siddhesh Sheth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheth, Siddhesh","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5126670493"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8468000292778015,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8468000292778015,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.04989999905228615,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.019200000911951065,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8658000230789185},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.5385000109672546},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4587000012397766},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.4586000144481659},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.43470001220703125},{"id":"https://openalex.org/keywords/context-effect","display_name":"Context effect","score":0.3880999982357025}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8658000230789185},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.714900016784668},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.5385000109672546},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48730000853538513},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4587000012397766},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.4586000144481659},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.43470001220703125},{"id":"https://openalex.org/C76188268","wikidata":"https://www.wikidata.org/wiki/Q1783165","display_name":"Context effect","level":3,"score":0.3880999982357025},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.37450000643730164},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37400001287460327},{"id":"https://openalex.org/C2983643213","wikidata":"https://www.wikidata.org/wiki/Q6030225","display_name":"Influence function","level":3,"score":0.35199999809265137},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2824999988079071},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.2624000012874603}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15723","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15723","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15723","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15723","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.4407804310321808}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1,47],"models":[2,48],"are":[3],"increasingly":[4],"deployed":[5],"in":[6,45,93,102,142],"settings":[7],"where":[8],"relevant":[9],"information":[10],"is":[11,149],"embedded":[12],"within":[13],"long":[14,172],"and":[15,55,144],"noisy":[16],"contexts.":[17],"Despite":[18],"this,":[19],"robustness":[20,44,143,159],"to":[21,84,118,152],"growing":[22],"context":[23,66,75,89,105,135,153],"length":[24,67,90,106],"remains":[25],"poorly":[26],"understood":[27],"across":[28],"different":[29],"question":[30],"answering":[31],"tasks.":[32,121],"In":[33,122],"this":[34],"work,":[35],"we":[36],"present":[37],"a":[38,62,99],"controlled":[39],"empirical":[40],"study":[41],"of":[42,64,73,88,131],"context-length":[43,158],"large":[46],"using":[49],"two":[50],"widely":[51],"used":[52],"benchmarks:":[53],"SQuAD":[54,132],"HotpotQA.":[56],"We":[57,155],"evaluate":[58],"model":[59,166],"accuracy":[60,129],"as":[61,104],"function":[63],"total":[65],"by":[68],"systematically":[69],"increasing":[70],"the":[71,78,86,128],"amount":[72],"irrelevant":[74],"while":[76],"preserving":[77],"answer-bearing":[79],"signal.":[80],"This":[81],"allows":[82],"us":[83],"isolate":[85],"effect":[87],"from":[91],"changes":[92],"task":[94],"difficulty.":[95],"Our":[96],"results":[97],"show":[98],"consistent":[100],"degradation":[101,130],"performance":[103],"increases,":[107],"with":[108],"substantially":[109],"larger":[110],"drops":[111],"observed":[112],"on":[113],"multi-hop":[114,147],"reasoning":[115,148],"tasks":[116],"compared":[117],"single-span":[119],"extraction":[120],"particular,":[123],"HotpotQA":[124],"exhibits":[125],"nearly":[126],"twice":[127],"under":[133],"equivalent":[134],"expansions.":[136],"These":[137],"findings":[138],"highlight":[139],"task-dependent":[140],"differences":[141],"suggest":[145],"that":[146,157],"especially":[150,168],"vulnerable":[151],"dilution.":[154],"argue":[156],"should":[160],"be":[161],"evaluated":[162],"explicitly":[163],"when":[164],"assessing":[165],"reliability,":[167],"for":[169],"applications":[170],"involving":[171],"documents":[173],"or":[174],"retrieval-augmented":[175],"generation.":[176]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
