{"id":"https://openalex.org/W4406461112","doi":"https://doi.org/10.1109/bigdata62323.2024.10825910","title":"ERATTA: Extreme RAG for enterprise-Table To Answers with Large Language Models","display_name":"ERATTA: Extreme RAG for enterprise-Table To Answers with Large Language Models","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406461112","doi":"https://doi.org/10.1109/bigdata62323.2024.10825910"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825910","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825910","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101931962","display_name":"Sohini Roychowdhury","orcid":"https://orcid.org/0009-0008-7575-9333"},"institutions":[{"id":"https://openalex.org/I4210099672","display_name":"Accenture (United States)","ror":"https://ror.org/013g16z83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210093804","https://openalex.org/I4210099672"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sohini Roychowdhury","raw_affiliation_strings":["Accenture,Corporate Data and Analytics Office (CDAO),USA"],"affiliations":[{"raw_affiliation_string":"Accenture,Corporate Data and Analytics Office (CDAO),USA","institution_ids":["https://openalex.org/I4210099672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059594013","display_name":"Marko Krema","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099672","display_name":"Accenture (United States)","ror":"https://ror.org/013g16z83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210093804","https://openalex.org/I4210099672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marko Krema","raw_affiliation_strings":["Accenture,Corporate Data and Analytics Office (CDAO),USA"],"affiliations":[{"raw_affiliation_string":"Accenture,Corporate Data and Analytics Office (CDAO),USA","institution_ids":["https://openalex.org/I4210099672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5097357210","display_name":"Anvar Mahammad","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099672","display_name":"Accenture (United States)","ror":"https://ror.org/013g16z83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210093804","https://openalex.org/I4210099672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anvar Mahammad","raw_affiliation_strings":["Accenture,Corporate Data and Analytics Office (CDAO),USA"],"affiliations":[{"raw_affiliation_string":"Accenture,Corporate Data and Analytics Office (CDAO),USA","institution_ids":["https://openalex.org/I4210099672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069591226","display_name":"Brian R. Moore","orcid":"https://orcid.org/0000-0002-9117-9792"},"institutions":[{"id":"https://openalex.org/I4210099672","display_name":"Accenture (United States)","ror":"https://ror.org/013g16z83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210093804","https://openalex.org/I4210099672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian Moore","raw_affiliation_strings":["Accenture,Corporate Data and Analytics Office (CDAO),USA"],"affiliations":[{"raw_affiliation_string":"Accenture,Corporate Data and Analytics Office (CDAO),USA","institution_ids":["https://openalex.org/I4210099672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031139197","display_name":"Arijit Mukherjee","orcid":"https://orcid.org/0000-0001-5052-4476"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arijit Mukherjee","raw_affiliation_strings":["Accenture,CDAO,India"],"affiliations":[{"raw_affiliation_string":"Accenture,CDAO,India","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5097335714","display_name":"Punit Prakashchandra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Punit Prakashchandra","raw_affiliation_strings":["Accenture,CDAO,India"],"affiliations":[{"raw_affiliation_string":"Accenture,CDAO,India","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101931962"],"corresponding_institution_ids":["https://openalex.org/I4210099672"],"apc_list":null,"apc_paid":null,"fwci":1.5448,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.8622676,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4605","last_page":"4610"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9915000200271606,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7077709436416626},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.5145992040634155},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.41672319173812866},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3210362195968628},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.18404516577720642}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7077709436416626},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.5145992040634155},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.41672319173812866},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3210362195968628},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.18404516577720642}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825910","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825910","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2072944755","https://openalex.org/W2890867094","https://openalex.org/W2962885446","https://openalex.org/W2963207291","https://openalex.org/W2963866663","https://openalex.org/W3009251324","https://openalex.org/W4387835442","https://openalex.org/W4388860683","https://openalex.org/W4391095288","https://openalex.org/W4399450508"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4394360958"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"with":[4,25,50],"retrieval":[5],"augmented-generation":[6],"(RAG)":[7],"have":[8,52],"been":[9,30,53],"the":[10,19,62,128,154,173,183],"optimal":[11],"choice":[12],"for":[13,41,94],"scalable":[14],"generative":[15],"AI":[16,26],"solutions":[17],"in":[18,112,123,134,153,172],"recent":[20],"past.":[21],"Although":[22],"RAG":[23,49,186],"implemented":[24],"agents":[27],"(agentic-RAG)":[28],"has":[29],"recently":[31],"popularized,":[32],"its":[33],"suffers":[34],"from":[35,97],"unstable":[36],"cost":[37],"and":[38,64,91,110,118,127,150,160,177],"unreliable":[39],"performances":[40],"Enterprise-level":[42,98],"data-practices.":[43],"Most":[44],"existing":[45],"use-cases":[46],"that":[47,148],"incorporate":[48],"LLMs":[51,80],"either":[54],"generic":[55],"or":[56],"extremely":[57],"domain":[58],"specific,":[59],"thereby":[60],"questioning":[61],"scalability":[63],"generalizability":[65],"of":[66,169],"RAG-LLM":[67],"approaches.":[68],"In":[69],"this":[70],"work,":[71],"we":[72,141],"propose":[73,142],"a":[74,143],"unique":[75],"LLM-based":[76],"system":[77,159],"where":[78],"multiple":[79],"can":[81,188],"be":[82],"invoked":[83],"to":[84,182],"enable":[85,189],"data":[86,99],"authentication,":[87],"user-query":[88],"routing,":[89],"data-retrieval":[90],"custom":[92],"prompting":[93],"question-answering":[95],"capabilities":[96],"tables":[100,105],"on":[101],"sustainability.":[102],"The":[103],"source":[104,191],"here":[106],"are":[107],"highly":[108],"fluctuating":[109],"large":[111],"size":[113],"storing":[114],"carbon":[115],"footprint,":[116],"energy":[117],"water":[119],"usage":[120],"at":[121],"buildings":[122],"regional":[124],"levels":[125],"globally":[126],"proposed":[129,158,184],"framework":[130],"enables":[131],"structured":[132],"responses":[133],"under":[135],"10":[136],"seconds":[137],"per":[138],"query.":[139],"Additionally,":[140],"five":[144],"metric":[145],"scoring":[146,161],"module":[147],"detects":[149],"reports":[151],"hallucinations":[152],"LLM":[155],"responses.":[156],"Our":[157],"metrics":[162],"achieve":[163],">90%":[164],"confidence":[165],"scores":[166],"across":[167],"hundreds":[168],"user":[170],"queries":[171],"sustainability,":[174],"financial":[175],"health":[176],"social":[178],"media":[179],"domains.":[180],"Extensions":[181],"extreme":[185],"architectures":[187],"heterogeneous":[190],"querying":[192],"using":[193],"LLMs.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
