{"id":"https://openalex.org/W7161782089","doi":"https://doi.org/10.48550/arxiv.2605.19735","title":"ContextRAG: Extraction-Free Hierarchical Graph Construction for Retrieval-Augmented Generation","display_name":"ContextRAG: Extraction-Free Hierarchical Graph Construction for Retrieval-Augmented Generation","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7161782089","doi":"https://doi.org/10.48550/arxiv.2605.19735"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.19735","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19735","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.19735","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136592710","display_name":"Roman Prosvirnin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Prosvirnin, Roman","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001647280","display_name":"\u0421\u0435\u0440\u0433\u0435\u0439 \u041a\u0443\u0437\u043d\u0435\u0446\u043e\u0432","orcid":"https://orcid.org/0000-0002-8257-028X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuznetsov, Sergei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5026203914","display_name":"Seungmin Jin","orcid":"https://orcid.org/0000-0002-8242-6157"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Seungmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5913000106811523,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.5913000106811523,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.13660000264644623,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.07289999723434448,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.607200026512146},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5217999815940857},{"id":"https://openalex.org/keywords/fuzzy-logic","display_name":"Fuzzy logic","score":0.3873000144958496},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.3783000111579895},{"id":"https://openalex.org/keywords/graph-database","display_name":"Graph database","score":0.37119999527931213},{"id":"https://openalex.org/keywords/directed-graph","display_name":"Directed graph","score":0.3601999878883362}],"concepts":[{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.607200026512146},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5914999842643738},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.553600013256073},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5217999815940857},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.3873000144958496},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3783000111579895},{"id":"https://openalex.org/C176225458","wikidata":"https://www.wikidata.org/wiki/Q595971","display_name":"Graph database","level":3,"score":0.37119999527931213},{"id":"https://openalex.org/C146380142","wikidata":"https://www.wikidata.org/wiki/Q1137726","display_name":"Directed graph","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.3447999954223633},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3434999883174896},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3287999927997589},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.3212999999523163},{"id":"https://openalex.org/C17169500","wikidata":"https://www.wikidata.org/wiki/Q3033506","display_name":"Null graph","level":5,"score":0.3068999946117401},{"id":"https://openalex.org/C64339825","wikidata":"https://www.wikidata.org/wiki/Q722659","display_name":"Graph property","level":5,"score":0.2919999957084656},{"id":"https://openalex.org/C106937863","wikidata":"https://www.wikidata.org/wiki/Q7236518","display_name":"Power graph analysis","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26460000872612},{"id":"https://openalex.org/C53811970","wikidata":"https://www.wikidata.org/wiki/Q5062194","display_name":"Centrality","level":2,"score":0.25529998540878296}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.19735","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19735","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.19735","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19735","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graph-structured":[0],"retrieval-augmented":[1],"generation":[2],"(RAG)":[3],"systems":[4,15],"can":[5],"improve":[6],"answer":[7],"quality":[8],"on":[9,17,131,158],"multi-hop":[10,159],"questions,":[11],"but":[12],"many":[13],"current":[14],"rely":[16],"large":[18],"language":[19],"models":[20],"(LLMs)":[21],"to":[22,142],"extract":[23],"entities,":[24],"relations,":[25],"and":[26,34,72,81,91,113,128,155],"summaries":[27],"during":[28,137],"indexing.":[29],"These":[30],"calls":[31,112,127],"add":[32],"token":[33],"wall-clock":[35],"costs":[36],"that":[37,165,184],"grow":[38],"with":[39,76,109],"corpus":[40],"size.":[41],"We":[42],"present":[43],"ContextRAG,":[44],"a":[45,62,101,118,132],"graph":[46,50,65,98,138],"RAG":[47],"system":[48],"whose":[49],"topology":[51],"is":[52,189],"constructed":[53],"without":[54],"LLM-based":[55],"entity":[56],"or":[57],"relation":[58],"extraction.":[59],"ContextRAG":[60,105,150],"derives":[61],"fuzzy":[63,89],"concept":[64],"over":[66,146,182],"chunk":[67],"embeddings":[68],"using":[69],"residual-quantization":[70],"k-means":[71],"Formal":[73],"Concept":[74],"Analysis":[75],"Lukasiewicz":[77],"residuated":[78],"logic.":[79],"Bridge-like":[80],"meet-derived":[82],"context":[83],"nodes":[84],"are":[85],"induced":[86],"by":[87,96],"soft":[88],"join":[90],"meet":[92],"operations,":[93],"rather":[94,191],"than":[95,192],"LLM-written":[97],"edges.":[99],"On":[100],"130-task":[102],"UltraDomain":[103],"subset,":[104],"builds":[106],"its":[107],"index":[108],"30":[110],"LLM":[111],"22,073":[114],"tokens.":[115,149],"In":[116],"contrast,":[117],"local":[119],"HiRAG":[120],"reproduction":[121],"stress":[122],"test":[123],"required":[124],"870":[125],"indexing":[126,148],"3.54M":[129],"tokens":[130],"20-task":[133],"subset":[134],"before":[135],"failing":[136],"construction;":[139],"linear":[140],"extrapolation":[141],"130":[143],"tasks":[144],"implies":[145],"23M":[147],"obtains":[151],"33.6%":[152],"F1":[153,157,181],"overall":[154],"36.8%":[156],"tasks.":[160],"An":[161],"activation":[162],"analysis":[163],"shows":[164],"queries":[166,183],"retrieving":[167],"at":[168],"least":[169],"one":[170],"lattice-derived":[171],"node":[172],"in":[173],"the":[174],"top":[175],"five":[176],"achieve":[177],"+3.9":[178],"percentage":[179],"points":[180],"do":[185],"not;":[186],"this":[187],"association":[188],"diagnostic":[190],"causal.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-21T00:00:00"}
