{"id":"https://openalex.org/W4399912398","doi":"https://doi.org/10.48550/arxiv.2406.13121","title":"Can Long-Context Language Models Subsume Retrieval, RAG, SQL, and More?","display_name":"Can Long-Context Language Models Subsume Retrieval, RAG, SQL, and More?","publication_year":2024,"publication_date":"2024-06-19","ids":{"openalex":"https://openalex.org/W4399912398","doi":"https://doi.org/10.48550/arxiv.2406.13121"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2406.13121","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.13121","pdf_url":"https://arxiv.org/pdf/2406.13121","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.13121","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002413587","display_name":"Jinhyuk Lee","orcid":"https://orcid.org/0000-0003-4972-239X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lee, Jinhyuk","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087171054","display_name":"Anthony Chen","orcid":"https://orcid.org/0000-0003-4363-5041"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Anthony","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062633736","display_name":"Zhuyun Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Zhuyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076846819","display_name":"Dheeru Dua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dua, Dheeru","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000168915","display_name":"Devendra Singh Sachan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sachan, Devendra Singh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062977994","display_name":"Michael Boratko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boratko, Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074697516","display_name":"Yi Luan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luan, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040494793","display_name":"S\u00e9bastien M. R. Arnold","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arnold, S\u00e9bastien M. R.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005123194","display_name":"Vincent Perot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Perot, Vincent","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068873086","display_name":"Siddharth Dalmia","orcid":"https://orcid.org/0000-0003-0437-5988"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dalmia, Siddharth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065708799","display_name":"Hexiang Hu","orcid":"https://orcid.org/0000-0002-4720-169X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Hexiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017578261","display_name":"Xudong Lin","orcid":"https://orcid.org/0000-0001-5479-4414"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Xudong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035867340","display_name":"Panupong Pasupat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pasupat, Panupong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034305203","display_name":"Aida Amini","orcid":"https://orcid.org/0000-0002-0576-5147"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amini, Aida","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090951421","display_name":"Jeremy R. Cole","orcid":"https://orcid.org/0000-0001-7147-5888"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cole, Jeremy R.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101404695","display_name":"Sebastian Riedel","orcid":"https://orcid.org/0000-0002-3655-2486"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Riedel, Sebastian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033760431","display_name":"Iftekhar Naim","orcid":"https://orcid.org/0000-0002-2119-3273"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naim, Iftekhar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076904467","display_name":"Ming\u2010Wei Chang","orcid":"https://orcid.org/0000-0002-0137-8895"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Ming-Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5076669462","display_name":"Kelvin Guu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guu, Kelvin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":19,"corresponding_author_ids":["https://openalex.org/A5002413587"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9797000288963318,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6728766560554504},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.6696729063987732},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.647195041179657},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.45082777738571167},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.419497013092041},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.35106098651885986},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3336403965950012},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3236100971698761},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.21452713012695312},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.08297476172447205},{"id":"https://openalex.org/keywords/archaeology","display_name":"Archaeology","score":0.07434681057929993}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6728766560554504},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.6696729063987732},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.647195041179657},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.45082777738571167},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.419497013092041},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.35106098651885986},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3336403965950012},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3236100971698761},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.21452713012695312},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.08297476172447205},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.07434681057929993}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2406.13121","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.13121","pdf_url":"https://arxiv.org/pdf/2406.13121","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2406.13121","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2406.13121","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.13121","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.13121","pdf_url":"https://arxiv.org/pdf/2406.13121","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4399912398.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2003932708","https://openalex.org/W1967424056","https://openalex.org/W2284877871","https://openalex.org/W2138102289","https://openalex.org/W868043274","https://openalex.org/W2513523087","https://openalex.org/W1187916458","https://openalex.org/W2373861055","https://openalex.org/W1559716973","https://openalex.org/W3109364360"],"abstract_inverted_index":{"Long-context":[0],"language":[1],"models":[2],"(LCLMs)":[3],"have":[4],"the":[5,43,64,71,149],"potential":[6,169],"to":[7,11,26,90,95,110,170],"revolutionize":[8],"our":[9],"approach":[10],"tasks":[12,86,177],"traditionally":[13],"reliant":[14],"on":[15,99],"external":[16],"tools":[17],"like":[18,133],"retrieval":[19,101,113],"systems":[20],"or":[21],"databases.":[22],"Leveraging":[23],"LCLMs'":[24,97,107],"ability":[25,109],"natively":[27],"ingest":[28],"and":[29,61,102,114,174],"process":[30],"entire":[31,72],"corpora":[32],"of":[33,48,66,84,92],"information":[34],"offers":[35],"numerous":[36],"advantages.":[37],"It":[38],"enhances":[39],"user-friendliness":[40],"by":[41],"eliminating":[42],"need":[44,150],"for":[45,63,123,151,165],"specialized":[46],"knowledge":[47],"tools,":[49],"provides":[50,160],"robust":[51],"end-to-end":[52],"modeling":[53],"that":[54,136],"minimizes":[55],"cascading":[56],"errors":[57],"in":[58,131,139],"complex":[59],"pipelines,":[60],"allows":[62],"application":[65],"sophisticated":[67],"prompting":[68,143],"techniques":[69],"across":[70],"system.":[73],"To":[74],"assess":[75],"this":[76],"paradigm":[77],"shift,":[78],"we":[79],"introduce":[80],"LOFT,":[81],"a":[82,161],"benchmark":[83],"real-world":[85],"requiring":[87],"context":[88,155],"up":[89],"millions":[91],"tokens":[93],"designed":[94],"evaluate":[96],"performance":[98],"in-context":[100],"reasoning.":[103],"Our":[104],"findings":[105],"reveal":[106],"surprising":[108],"rival":[111],"state-of-the-art":[112],"RAG":[115],"systems,":[116],"despite":[117],"never":[118],"having":[119],"been":[120],"explicitly":[121],"trained":[122],"these":[124],"tasks.":[125,141],"However,":[126],"LCLMs":[127],"still":[128],"face":[129],"challenges":[130],"areas":[132],"compositional":[134],"reasoning":[135],"are":[137],"required":[138],"SQL-like":[140],"Notably,":[142],"strategies":[144],"significantly":[145],"influence":[146],"performance,":[147],"emphasizing":[148],"continued":[152],"research":[153],"as":[154,178],"lengths":[156],"grow.":[157],"Overall,":[158],"LOFT":[159],"rigorous":[162],"testing":[163],"ground":[164],"LCLMs,":[166],"showcasing":[167],"their":[168],"supplant":[171],"existing":[172],"paradigms":[173],"tackle":[175],"novel":[176],"model":[179],"capabilities":[180],"scale.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
