{"id":"https://openalex.org/W7134836697","doi":"https://doi.org/10.48550/arxiv.2603.08329","title":"SPD-RAG: Sub-Agent Per Document Retrieval-Augmented Generation","display_name":"SPD-RAG: Sub-Agent Per Document Retrieval-Augmented Generation","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134836697","doi":"https://doi.org/10.48550/arxiv.2603.08329"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.08329","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128639518","display_name":"Yagiz Can Akay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akay, Yagiz Can","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kartal, Muhammed Yusuf","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kartal, Muhammed Yusuf","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128655423","display_name":"Esra Alparslan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alparslan, Esra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128675517","display_name":"Faruk Ortakoyluoglu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ortakoyluoglu, Faruk","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128672031","display_name":"Arda Akpinar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akpinar, Arda","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8529000282287598,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.8529000282287598,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.06440000236034393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.014999999664723873,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7163000106811523},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.6916000247001648},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5473999977111816},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4390999972820282},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.39809998869895935},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.37860000133514404},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3716000020503998}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7875000238418579},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7163000106811523},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.6916000247001648},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5473999977111816},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4860000014305115},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4390999972820282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4074999988079071},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.39809998869895935},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.37860000133514404},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3716000020503998},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.32339999079704285},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.31630000472068787},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31040000915527344},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.29260000586509705},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.28360000252723694},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2800000011920929},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.25360000133514404},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.25270000100135803}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.08329","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.08329","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08329","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.08329","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Answering":[0],"complex,":[1],"real-world":[2],"queries":[3],"often":[4],"requires":[5],"synthesizing":[6],"facts":[7],"scattered":[8],"across":[9],"vast":[10],"document":[11,57,60],"corpora.":[12],"In":[13],"these":[14],"settings,":[15],"standard":[16],"retrieval-augmented":[17],"generation":[18],"(RAG)":[19],"pipelines":[20],"suffer":[21],"from":[22],"incomplete":[23],"evidence":[24],"coverage,":[25],"while":[26,77,125,159],"long-context":[27,139],"large":[28],"language":[29],"models":[30],"(LLMs)":[31],"struggle":[32],"to":[33,82],"reason":[34],"reliably":[35],"over":[36],"massive":[37,108],"inputs.":[38],"We":[39],"introduce":[40],"SPD-RAG,":[41],"a":[42,64,78,99,127,168],"hierarchical":[43],"multi-agent":[44],"framework":[45],"for":[46,107,138],"exhaustive":[47],"cross-document":[48],"question":[49],"answering":[50],"that":[51],"decomposes":[52],"the":[53,56,133,164],"problem":[54],"along":[55],"axis.":[58],"Each":[59],"is":[61],"processed":[62],"by":[63,94],"dedicated":[65],"document-level":[66,111],"agent":[67],"operating":[68],"only":[69,161],"on":[70],"its":[71],"own":[72],"content,":[73],"enabling":[74],"focused":[75],"retrieval,":[76],"coordinator":[79],"dispatches":[80],"tasks":[81],"relevant":[83],"agents":[84],"and":[85,118,155],"aggregates":[86],"their":[87],"partial":[88,96],"answers.":[89],"Agent":[90],"outputs":[91],"are":[92],"synthesized":[93],"merging":[95],"answers":[97],"through":[98],"token-bounded":[100],"synthesis":[101],"layer":[102],"(which":[103],"supports":[104],"recursive":[105],"map-reduce":[106],"corpora).":[109],"This":[110],"specialization":[112],"with":[113],"centralized":[114],"fusion":[115],"improves":[116],"scalability":[117],"answer":[119],"quality":[120],"in":[121],"heterogeneous":[122],"multidocument":[123],"settings":[124],"yielding":[126],"modular,":[128],"extensible":[129],"retrieval":[130],"pipeline.":[131],"On":[132],"LOONG":[134],"benchmark":[135],"(EMNLP":[136],"2024)":[137],"multi-document":[140],"QA,":[141],"SPD-RAG":[142],"achieves":[143],"an":[144],"Avg":[145],"Score":[146],"of":[147,163,167],"58.1":[148],"(GPT-5":[149],"evaluation),":[150],"outperforming":[151],"Normal":[152],"RAG":[153,157],"(33.0)":[154],"Agentic":[156],"(32.8)":[158],"using":[160],"38%":[162],"API":[165],"cost":[166],"full-context":[169],"baseline":[170],"(68.0).":[171]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-11T00:00:00"}
