{"id":"https://openalex.org/W7128609912","doi":"https://doi.org/10.48550/arxiv.2602.09616","title":"With Argus Eyes: Assessing Retrieval Gaps via Uncertainty Scoring to Detect and Remedy Retrieval Blind Spots","display_name":"With Argus Eyes: Assessing Retrieval Gaps via Uncertainty Scoring to Detect and Remedy Retrieval Blind Spots","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128609912","doi":"https://doi.org/10.48550/arxiv.2602.09616"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.09616","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029008194","display_name":"Zeinab Taghavi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taghavi, Zeinab Sadat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125679383","display_name":"Ali Modarressi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Modarressi, Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125671105","display_name":"Hinrich Schutze","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schutze, Hinrich","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125631816","display_name":"Andreas Marfurt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marfurt, Andreas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.7789000272750854,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.7789000272750854,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11649999767541885,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.04580000042915344,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5837000012397766},{"id":"https://openalex.org/keywords/argus","display_name":"Argus","score":0.5371000170707703},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.421099990606308},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.400299996137619},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.399399995803833},{"id":"https://openalex.org/keywords/blind-spot","display_name":"Blind spot","score":0.3959999978542328}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7369999885559082},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5837000012397766},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5575000047683716},{"id":"https://openalex.org/C2776760603","wikidata":"https://www.wikidata.org/wiki/Q3622471","display_name":"Argus","level":2,"score":0.5371000170707703},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5120000243186951},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.421099990606308},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.400299996137619},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.399399995803833},{"id":"https://openalex.org/C64731932","wikidata":"https://www.wikidata.org/wiki/Q371090","display_name":"Blind spot","level":2,"score":0.3959999978542328},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3707999885082245},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.3046000003814697},{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.3034999966621399},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2711000144481659},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.26249998807907104}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.09616","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.09616","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09616","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.09616","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reliable":[0],"retrieval-augmented":[1],"generation":[2],"(RAG)":[3],"systems":[4,23,201],"depend":[5],"fundamentally":[6],"on":[7,155],"the":[8,31,40,47,52,68,131],"retriever's":[9],"ability":[10],"to":[11,33,39,46,61,64],"find":[12],"relevant":[13,38],"information.":[14],"We":[15,50],"show":[16,96,160],"that":[17,36,55,97,129,161,188],"neural":[18],"retrievers":[19,103,169],"used":[20],"in":[21,72,101,150,182],"RAG":[22,200],"have":[24,43],"blind":[25,58,98,122,191],"spots,":[26,123],"which":[27],"we":[28,95,124],"define":[29],"as":[30],"failure":[32],"retrieve":[34],"entities":[35,60,136],"are":[37],"query,":[41],"but":[42],"low":[44,73],"similarity":[45],"query":[48],"embedding.":[49],"investigate":[51],"training-induced":[53],"biases":[54],"cause":[56],"such":[57],"spot":[59,99],"be":[62,108],"mapped":[63],"inaccessible":[65],"parts":[66],"of":[67,86,133,148],"embedding":[69,113],"space,":[70],"resulting":[71],"retrievability.":[74],"Using":[75],"a":[76,127,142],"large-scale":[77],"dataset":[78],"constructed":[79],"from":[80,111,141],"Wikidata":[81],"relations":[82],"and":[83,88,158,173,198,203],"first":[84,146],"paragraphs":[85,147],"Wikipedia,":[87,149],"our":[89,151],"proposed":[90],"Retrieval":[91],"Probability":[92],"Score":[93],"(RPS),":[94],"risk":[100],"standard":[102],"(e.g.,":[104],"CONTRIEVER,":[105],"REASONIR)":[106],"can":[107],"predicted":[109],"pre-index":[110],"entity":[112],"geometry,":[114],"avoiding":[115],"expensive":[116],"retrieval":[117],"evaluations.":[118],"To":[119],"address":[120],"these":[121],"introduce":[125],"ARGUS,":[126],"pipeline":[128],"enables":[130],"retrievability":[132],"high-risk":[134],"(low-RPS)":[135],"through":[137],"targeted":[138],"document":[139],"augmentation":[140],"knowledge":[143],"base":[144],"(KB),":[145],"case.":[152],"Extensive":[153],"experiments":[154],"BRIGHT,":[156],"IMPLIRET,":[157],"RAR-B":[159],"ARGUS":[162],"achieves":[163],"consistent":[164],"improvements":[165],"across":[166],"all":[167],"evaluated":[168],"(averaging":[170],"+3.4":[171],"nDCG@5":[172],"+4.5":[174],"nDCG@10":[175],"absolute":[176],"points),":[177],"with":[178],"substantially":[179],"larger":[180],"gains":[181],"challenging":[183],"subsets.":[184],"These":[185],"results":[186],"establish":[187],"preemptively":[189],"remedying":[190],"spots":[192],"is":[193],"critical":[194],"for":[195],"building":[196],"robust":[197],"trustworthy":[199],"(Code":[202],"Data).":[204]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-12T00:00:00"}
