{"id":"https://openalex.org/W7114889968","doi":"https://doi.org/10.3390/bdcc9120320","title":"A Systematic Literature Review of Retrieval-Augmented Generation: Techniques, Metrics, and Challenges","display_name":"A Systematic Literature Review of Retrieval-Augmented Generation: Techniques, Metrics, and Challenges","publication_year":2025,"publication_date":"2025-12-12","ids":{"openalex":"https://openalex.org/W7114889968","doi":"https://doi.org/10.3390/bdcc9120320"},"language":"en","primary_location":{"id":"doi:10.3390/bdcc9120320","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120320","pdf_url":"https://www.mdpi.com/2504-2289/9/12/320/pdf","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-2289/9/12/320/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Andrew Brown","orcid":"https://orcid.org/0009-0004-9250-9038"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Andrew Brown","raw_affiliation_strings":["Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK"],"affiliations":[{"raw_affiliation_string":"Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK","institution_ids":["https://openalex.org/I126231945"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Muhammad Roman","orcid":"https://orcid.org/0000-0002-9035-2426"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]},{"id":"https://openalex.org/I178777954","display_name":"Kohat University of Science and Technology","ror":"https://ror.org/057d2v504","country_code":"PK","type":"education","lineage":["https://openalex.org/I178777954"]}],"countries":["GB","PK"],"is_corresponding":false,"raw_author_name":"Muhammad Roman","raw_affiliation_strings":["Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK","Institute of Computing (IoC), Kohat University of Science & Technology (KUST), Kohat 26000, Pakistan"],"affiliations":[{"raw_affiliation_string":"Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK","institution_ids":["https://openalex.org/I126231945"]},{"raw_affiliation_string":"Institute of Computing (IoC), Kohat University of Science & Technology (KUST), Kohat 26000, Pakistan","institution_ids":["https://openalex.org/I178777954"]}]},{"author_position":"last","author":{"id":null,"display_name":"Barry Devereux","orcid":"https://orcid.org/0000-0003-2128-8632"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Barry Devereux","raw_affiliation_strings":["Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK"],"affiliations":[{"raw_affiliation_string":"Advanced Research and Engineering Centre (ARC), Queen\u2019s University Belfast, Belfast BT7 1NN, UK","institution_ids":["https://openalex.org/I126231945"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I126231945"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":6.4989,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.968,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"9","issue":"12","first_page":"320","last_page":"320"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12553","display_name":"Psychedelics and Drug Studies","score":0.14010000228881836,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12553","display_name":"Psychedelics and Drug Studies","score":0.14010000228881836,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.08799999952316284,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10576","display_name":"Opioid Use Disorder Treatment","score":0.0430000014603138,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/systematic-review","display_name":"Systematic review","score":0.6480000019073486},{"id":"https://openalex.org/keywords/citation","display_name":"Citation","score":0.642799973487854},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.5239999890327454},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.400299996137619},{"id":"https://openalex.org/keywords/descriptive-statistics","display_name":"Descriptive statistics","score":0.32019999623298645},{"id":"https://openalex.org/keywords/citation-analysis","display_name":"Citation analysis","score":0.28540000319480896}],"concepts":[{"id":"https://openalex.org/C189708586","wikidata":"https://www.wikidata.org/wiki/Q1504425","display_name":"Systematic review","level":3,"score":0.6480000019073486},{"id":"https://openalex.org/C2778805511","wikidata":"https://www.wikidata.org/wiki/Q1713","display_name":"Citation","level":2,"score":0.642799973487854},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5264000296592712},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.5239999890327454},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46470001339912415},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.400299996137619},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3474000096321106},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34290000796318054},{"id":"https://openalex.org/C39896193","wikidata":"https://www.wikidata.org/wiki/Q380344","display_name":"Descriptive statistics","level":2,"score":0.32019999623298645},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.290800005197525},{"id":"https://openalex.org/C105345328","wikidata":"https://www.wikidata.org/wiki/Q206276","display_name":"Citation analysis","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.28369998931884766},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.2743000090122223},{"id":"https://openalex.org/C100253034","wikidata":"https://www.wikidata.org/wiki/Q196372","display_name":"Systematic error","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.265500009059906},{"id":"https://openalex.org/C513874922","wikidata":"https://www.wikidata.org/wiki/Q212805","display_name":"Digital library","level":3,"score":0.26080000400543213},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.25940001010894775},{"id":"https://openalex.org/C509550671","wikidata":"https://www.wikidata.org/wiki/Q126945","display_name":"Medical education","level":1,"score":0.2549999952316284}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/bdcc9120320","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120320","pdf_url":"https://www.mdpi.com/2504-2289/9/12/320/pdf","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},{"id":"pmh:oai:pure.qub.ac.uk/portal:openaire/4b181d3c-5b1b-4380-b5f7-85ba9c38ea4d","is_oa":true,"landing_page_url":"https://pure.qub.ac.uk/en/publications/4b181d3c-5b1b-4380-b5f7-85ba9c38ea4d","pdf_url":null,"source":{"id":"https://openalex.org/S4306402319","display_name":"Research Portal (Queen's University Belfast)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I126231945","host_organization_name":"Queen's University Belfast","host_organization_lineage":["https://openalex.org/I126231945"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Brown, A, Roman, M & Devereux, B 2025, 'A systematic literature review of retrieval-augmented generation: techniques, metrics, and challenges', Big Data and Cognitive Computing, vol. 9, no. 12, 320. https://doi.org/10.3390/bdcc9120320","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:doaj.org/article:c928715e303f4258864e2b3d549b26ce","is_oa":true,"landing_page_url":"https://doaj.org/article/c928715e303f4258864e2b3d549b26ce","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Big Data and Cognitive Computing, Vol 9, Iss 12, p 320 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/bdcc9120320","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9120320","pdf_url":"https://www.mdpi.com/2504-2289/9/12/320/pdf","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320314204","display_name":"Invest Northern Ireland","ror":"https://ror.org/00qnrsq87"},{"id":"https://openalex.org/F4320320357","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62"},{"id":"https://openalex.org/F4320320859","display_name":"Ulster University","ror":"https://ror.org/01yp9g959"},{"id":"https://openalex.org/F4320321832","display_name":"Queen's University","ror":"https://ror.org/02y72wh86"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W7114889968.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Background:":[0],"Retrieval-augmented":[1],"generation":[2],"(RAG)":[3],"aims":[4],"to":[5,34,158,166,175,186,223,268,280,289],"reduce":[6],"hallucinations":[7],"and":[8,26,47,50,59,76,115,125,146,177,190,210,233,251,255,278,283,301,307,314,332,340],"outdated":[9],"knowledge":[10],"by":[11,172,326,333],"grounding":[12,282],"LLM":[13,148],"outputs":[14],"in":[15,61],"retrieved":[16],"evidence,":[17],"but":[18],"empirical":[19,36],"results":[20],"are":[21,260],"scattered":[22],"across":[23],"tasks,":[24],"systems,":[25,291],"metrics,":[27],"limiting":[28],"cumulative":[29],"insight.":[30],"Objective:":[31],"We":[32,66,161,193,318],"aimed":[33],"synthesise":[35,167],"evidence":[37,321],"on":[38,83],"RAG":[39,96,226],"effectiveness":[40],"versus":[41],"parametric-only":[42],"baselines,":[43],"map":[44],"datasets/architectures/evaluation":[45],"practices,":[46],"surface":[48],"limitations":[49],"research":[51],"gaps.":[52],"Methods:":[53],"This":[54,87],"systematic":[55],"review":[56],"was":[57,132,183],"conducted":[58],"reported":[60],"accordance":[62],"with":[63,134,142,227,240,299],"PRISMA":[64],"2020.":[65],"searched":[67,82],"the":[68,168,320,329],"ACM":[69],"Digital":[70],"Library,":[71],"IEEE":[72],"Xplore,":[73],"Scopus,":[74],"ScienceDirect,":[75],"DBLP;":[77],"all":[78],"sources":[79],"were":[80,150,156],"last":[81],"13":[84],"May":[85],"2025.":[86],"included":[88,194],"studies":[89,171,196],"from":[90,218,287,328],"January":[91],"2020\u2013May":[92],"2025":[93,153],"that":[94,311],"addressed":[95],"or":[97,113],"similar":[98],"retrieval-supported":[99],"systems":[100],"producing":[101],"text":[102],"output,":[103],"met":[104],"citation":[105,154],"thresholds":[106,155,331],"(\u226515":[107],"for":[108,111],"2025;":[109],"\u226530":[110],"2024":[112],"earlier),":[114],"offered":[116],"original":[117],"contributions;":[118],"excluded":[119],"non-English":[120],"items,":[121],"irrelevant":[122],"works,":[123],"duplicates,":[124],"records":[126],"without":[127],"accessible":[128],"full":[129],"text.":[130],"Bias":[131],"appraised":[133],"a":[135,163,266],"brief":[136],"checklist;":[137],"screening":[138],"used":[139,162],"one":[140],"reviewer":[141],"an":[143],"independent":[144],"check":[145],"discussion.":[147],"suggestions":[149],"advisory":[151],"only;":[152],"adjusted":[157],"limit":[159],"citation-lag.":[160],"descriptive":[164],"approach":[165],"results,":[169],"organising":[170],"themes":[173],"aligned":[174],"RQ1\u2013RQ4":[176],"reporting":[178],"summary":[179],"counts/frequencies;":[180],"no":[181],"meta-analysis":[182],"undertaken":[184],"due":[185],"heterogeneity":[187],"of":[188,243],"designs":[189],"metrics.":[191],"Results:":[192],"128":[195],"spanning":[197],"knowledge-intensive":[198],"tasks":[199],"(35/128;":[200],"27.3%),":[201],"open-domain":[202],"QA":[203],"(20/128;":[204],"15.6%),":[205],"software":[206],"engineering":[207],"(13/128;":[208],"10.2%),":[209],"medical":[211],"domains":[212],"(11/128;":[213],"8.6%).":[214],"Methods":[215],"have":[216],"shifted":[217],"DPR":[219],"+":[220],"seq2seq":[221],"baselines":[222],"modular,":[224,269],"policy-driven":[225,270],"hybrid/structure-aware":[228,273],"retrieval,":[229,274],"uncertainty-triggered":[230],"loops,":[231],"memory,":[232,277],"emerging":[234],"multimodality.":[235],"Evaluation":[236],"remains":[237],"overlap-heavy":[238],"(EM/F1),":[239],"increasing":[241],"use":[242],"retrieval":[244],"diagnostics":[245],"(e.g.,":[246],"Recall@k,":[247],"MRR@k),":[248],"human":[249],"judgements,":[250],"LLM-as-judge":[252],"protocols.":[253],"Efficiency":[254],"security":[256],"(poisoning,":[257],"leakage,":[258],"jailbreaks)":[259],"growing":[261],"concerns.":[262],"Discussion:":[263],"Evidence":[264],"supports":[265],"shift":[267],"RAG,":[271],"combining":[272],"uncertainty-aware":[275],"control,":[276],"multimodality,":[279],"improve":[281],"efficiency.":[284],"To":[285],"advance":[286],"prototypes":[288],"dependable":[290],"we":[292],"recommend:":[293],"(i)":[294],"holistic":[295],"benchmarks":[296],"pairing":[297],"quality":[298],"cost/latency":[300],"safety,":[302],"(ii)":[303],"budget-aware":[304],"retrieval/tool-use":[305],"policies,":[306],"(iii)":[308],"provenance-aware":[309],"pipelines":[310],"expose":[312],"uncertainty":[313],"deliver":[315],"traceable":[316],"evidence.":[317],"note":[319],"base":[322],"may":[323],"be":[324],"affected":[325],"citation-lag":[327],"inclusion":[330],"English-only,":[334],"five-library":[335],"coverage.":[336],"Funding:":[337],"Advanced":[338],"Research":[339],"Engineering":[341],"Centre.":[342],"Registration:":[343],"Not":[344],"registered.":[345]},"counts_by_year":[{"year":2026,"cited_by_count":3}],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-12-12T00:00:00"}
