{"id":"https://openalex.org/W4414921206","doi":"https://doi.org/10.1145/3774904.3792589","title":"GraphRAG-R1: Graph Retrieval-Augmented Generation with Process-Constrained Reinforcement Learning","display_name":"GraphRAG-R1: Graph Retrieval-Augmented Generation with Process-Constrained Reinforcement Learning","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W4414921206","doi":"https://doi.org/10.1145/3774904.3792589"},"language":"en","primary_location":{"id":"doi:10.1145/3774904.3792589","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792589","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3774904.3792589","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077784388","display_name":"Caiyang Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuanyue Yu","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008349845","display_name":"Kuo Zhao","orcid":"https://orcid.org/0000-0002-7030-0338"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kuo Zhao","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100332392","display_name":"Yuhan Li","orcid":"https://orcid.org/0000-0001-6741-2833"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yuhan Li","raw_affiliation_strings":["HKUST Guangzhou, Guangzhou, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"HKUST Guangzhou, Guangzhou, Guangdong, China","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027050251","display_name":"Heng Chang","orcid":"https://orcid.org/0000-0002-4978-8041"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]},{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["CN","GB"],"is_corresponding":false,"raw_author_name":"Heng Chang","raw_affiliation_strings":["Huawei Technologies Ltd, Haidian District, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Ltd, Haidian District, Beijing, China","institution_ids":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112947020","display_name":"Mingjian Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingjian Feng","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031312235","display_name":"Xiangzhe Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangzhe Jiang","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101411542","display_name":"Yufei Sun","orcid":"https://orcid.org/0009-0000-0896-0610"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufei Sun","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103240065","display_name":"Jia Li","orcid":"https://orcid.org/0000-0001-6111-7518"},"institutions":[{"id":"https://openalex.org/I4210159029","display_name":"Guangzhou HKUST Fok Ying Tung Research Institute","ror":"https://ror.org/05cvbj479","country_code":"CN","type":"facility","lineage":["https://openalex.org/I200769079","https://openalex.org/I4210159029"]},{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Jia Li","raw_affiliation_strings":["Beihang University, Haidian District, Beijing, China","HKUST Guangzhou, Guangzhou, Guandong, China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Haidian District, Beijing, China","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"HKUST Guangzhou, Guangzhou, Guandong, China","institution_ids":["https://openalex.org/I4210159029","https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100657058","display_name":"Yuzhi Zhang","orcid":"https://orcid.org/0000-0002-6729-925X"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuzhi Zhang","raw_affiliation_strings":["Nankai University, Binhai New Area, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University, Binhai New Area, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qingyun Sun","orcid":"https://orcid.org/0000-0003-1930-3848"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingyun Sun","raw_affiliation_strings":["Beihang University, Haidian District, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Haidian District, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100442619","display_name":"Ziwei Zhang","orcid":"https://orcid.org/0000-0003-2451-843X"},"institutions":[{"id":"https://openalex.org/I4210159029","display_name":"Guangzhou HKUST Fok Ying Tung Research Institute","ror":"https://ror.org/05cvbj479","country_code":"CN","type":"facility","lineage":["https://openalex.org/I200769079","https://openalex.org/I4210159029"]},{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Jianxin Li","raw_affiliation_strings":["Beihang University, Haidian District, Beijing, China","HKUST Guangzhou, Guangzhou, Guandong, China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Haidian District, Beijing, China","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"HKUST Guangzhou, Guangzhou, Guandong, China","institution_ids":["https://openalex.org/I4210159029","https://openalex.org/I889458895"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100442619","display_name":"Ziwei Zhang","orcid":"https://orcid.org/0000-0003-2451-843X"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziwei Zhang","raw_affiliation_strings":["Beihang University, Haidian District, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Haidian District, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5077784388"],"corresponding_institution_ids":["https://openalex.org/I205237279"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00448894,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1398","last_page":"1409"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9810000061988831,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9789000153541565,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.659500002861023},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.65420001745224},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5432000160217285},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4749999940395355},{"id":"https://openalex.org/keywords/knowledge-representation-and-reasoning","display_name":"Knowledge representation and reasoning","score":0.33180001378059387}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7423999905586243},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.659500002861023},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.65420001745224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5519999861717224},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5432000160217285},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5005999803543091},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4749999940395355},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.33180001378059387},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.30309998989105225},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.29919999837875366},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2890999913215637}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3774904.3792589","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792589","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2507.23581","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.23581","pdf_url":"https://arxiv.org/pdf/2507.23581","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:doi:10.48550/arxiv.2507.23581","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2507.23581","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.23581","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1145/3774904.3792589","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792589","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graph":[0],"Retrieval-Augmented":[1],"Generation":[2],"(GraphRAG)":[3],"has":[4],"shown":[5],"great":[6],"effectiveness":[7],"in":[8,234],"enhancing":[9],"the":[10,63,90,130,141,160,172,221],"reasoning":[11,64,92,222,237],"abilities":[12],"of":[13,66,118],"Large":[14],"Language":[15],"Models":[16],"(LLMs)":[17],"by":[18,79],"leveraging":[19],"graph":[20],"structures":[21],"for":[22],"knowledge":[23],"representation":[24],"and":[25,49,58,108,193,206,247],"modeling":[26],"complex":[27,40,98,236],"real-world":[28],"relationships.":[29],"However,":[30],"existing":[31,259],"GraphRAG":[32,77,200,242],"methods":[33,243],"still":[34],"face":[35],"significant":[36],"bottlenecks":[37],"when":[38],"handling":[39],"problems":[41,238],"that":[42,124,228],"require":[43],"multi-hop":[44,91],"reasoning,":[45],"as":[46],"their":[47],"query":[48],"retrieval":[50,102,143,218,260],"phases":[51],"are":[52],"largely":[53],"based":[54],"on":[55,244],"pre-defined":[56],"heuristics":[57],"do":[59],"not":[60],"fully":[61],"utilize":[62,114],"potentials":[65],"LLMs.":[67],"To":[68,139],"address":[69],"this":[70],"problem,":[71,144,162],"we":[72,113,133,145,163],"propose":[73],"GraphRAG-R1,":[74],"an":[75],"adaptive":[76],"framework":[78,252],"training":[80,183,187],"LLMs":[81],"with":[82,175,201,257],"process-constrained":[83,136],"outcome-based":[84],"reinforcement":[85],"learning":[86],"(RL)":[87],"to":[88,104,128,153,158,170,190,219,240],"enhance":[89],"ability.":[93],"Our":[94],"method":[95,213],"can":[96,253],"decompose":[97],"problems,":[99],"autonomously":[100],"invoke":[101],"tools":[103],"acquire":[105],"necessary":[106],"information,":[107],"perform":[109],"effective":[110],"reasoning.":[111],"Specifically,":[112],"a":[115,147,165,181,215],"modified":[116],"version":[117],"Group":[119],"Relative":[120],"Policy":[121],"Optimization":[122],"(GRPO)":[123],"supports":[125],"rollout-with-thinking":[126],"capability":[127],"train":[129],"model.":[131],"Next,":[132],"design":[134,146,164,180],"two":[135,195],"reward":[137,152,169],"functions.":[138],"handle":[140,159],"shallow":[142],"Progressive":[148],"Retrieval":[149],"Attenuation":[150],"(PRA)":[151],"encourage":[154],"essential":[155],"retrievals.":[156],"Then,":[157],"over-thinking":[161],"Cost-Aware":[166],"F1":[167],"(CAF)":[168],"balance":[171],"model":[173],"performance":[174,264],"computational":[176],"costs.":[177],"We":[178],"further":[179],"phase-dependent":[182],"strategy,":[184],"containing":[185],"three":[186],"stages":[188,198],"corresponding":[189],"cold":[191],"start":[192],"these":[194],"rewards.":[196],"These":[197],"empower":[199],"format":[202],"following,":[203],"behavior":[204],"shaping,":[205],"smartness":[207],"optimization":[208],"abilities,":[209],"respectively.":[210],"Lastly,":[211],"our":[212,251],"adopts":[214],"hybrid":[216],"graph-textual":[217],"improve":[220],"capacity.":[223],"Extensive":[224],"experimental":[225],"results":[226],"demonstrate":[227],"GraphRAG-R1":[229],"significantly":[230],"boosts":[231],"LLM":[232],"capabilities":[233],"solving":[235],"compared":[239],"state-of-the-art":[241],"both":[245],"in-domain":[246],"out-of-domain":[248],"datasets.":[249],"Furthermore,":[250],"be":[254],"flexibly":[255],"integrated":[256],"various":[258],"methods,":[261],"consistently":[262],"delivering":[263],"improvements.":[265]},"counts_by_year":[],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
