{"id":"https://openalex.org/W7106230846","doi":"https://doi.org/10.1109/tsc.2025.3635384","title":"SageCopilot: An LLM-Empowered Autonomous Agent for Data Science as a Service","display_name":"SageCopilot: An LLM-Empowered Autonomous Agent for Data Science as a Service","publication_year":2025,"publication_date":"2025-11-21","ids":{"openalex":"https://openalex.org/W7106230846","doi":"https://doi.org/10.1109/tsc.2025.3635384"},"language":null,"primary_location":{"id":"doi:10.1109/tsc.2025.3635384","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsc.2025.3635384","pdf_url":null,"source":{"id":"https://openalex.org/S204223317","display_name":"IEEE Transactions on Services Computing","issn_l":"1939-1374","issn":["1939-1374","2372-0204"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Services Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yuan Liao","orcid":"https://orcid.org/0009-0008-4826-7886"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuan Liao","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiang Bian","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiang Bian","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yuhui Yun","orcid":"https://orcid.org/0009-0000-9726-1861"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhui Yun","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shuo Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuo Wang","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yubo Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yubo Zhang","raw_affiliation_strings":["Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiaming Chu","orcid":"https://orcid.org/0000-0002-3040-3674"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaming Chu","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tao Wang","orcid":"https://orcid.org/0000-0003-4740-6932"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Wang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yuchen Li","orcid":"https://orcid.org/0000-0002-3869-7881"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuchen Li","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xuhong Li","orcid":"https://orcid.org/0000-0002-2582-8256"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuhong Li","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shilei Ji","orcid":"https://orcid.org/0009-0001-4443-0294"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shilei Ji","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"last","author":{"id":null,"display_name":"Haoyi Xiong","orcid":"https://orcid.org/0000-0002-5451-3253"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyi Xiong","raw_affiliation_strings":["Baidu, Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu, Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I98301712"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.58059649,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"19","issue":"1","first_page":"642","last_page":"656"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.13979999721050262,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.13979999721050262,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08240000158548355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.0763000026345253,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.7559999823570251},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.7092000246047974},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.583299994468689},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.5309000015258789},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5252000093460083},{"id":"https://openalex.org/keywords/data-manipulation-language","display_name":"Data manipulation language","score":0.4880000054836273},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4575999975204468},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4223000109195709},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.4066999852657318}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8950999975204468},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.7559999823570251},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.7092000246047974},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.583299994468689},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.5309000015258789},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5252000093460083},{"id":"https://openalex.org/C56288433","wikidata":"https://www.wikidata.org/wiki/Q58673","display_name":"Data manipulation language","level":2,"score":0.4880000054836273},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4575999975204468},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4223000109195709},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.4066999852657318},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.38440001010894775},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.3743000030517578},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.36419999599456787},{"id":"https://openalex.org/C67463725","wikidata":"https://www.wikidata.org/wiki/Q17081452","display_name":"Natural language programming","level":5,"score":0.3601999878883362},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.33570000529289246},{"id":"https://openalex.org/C174252522","wikidata":"https://www.wikidata.org/wiki/Q3816772","display_name":"Natural language user interface","level":3,"score":0.3257000148296356},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32510000467300415},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.32499998807907104},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.3197000026702881},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3181999921798706},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C100463513","wikidata":"https://www.wikidata.org/wiki/Q5227322","display_name":"Data model (GIS)","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C19024347","wikidata":"https://www.wikidata.org/wiki/Q211496","display_name":"High-level programming language","level":3,"score":0.27619999647140503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26930001378059387},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2671999931335449},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsc.2025.3635384","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsc.2025.3635384","pdf_url":null,"source":{"id":"https://openalex.org/S204223317","display_name":"IEEE Transactions on Services Computing","issn_l":"1939-1374","issn":["1939-1374","2372-0204"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Services Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.43082717061042786,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W2610221865","https://openalex.org/W2803317679","https://openalex.org/W3034835156","https://openalex.org/W3106221893","https://openalex.org/W3200079259","https://openalex.org/W4312238419","https://openalex.org/W4385562710","https://openalex.org/W4385573003"],"related_works":[],"abstract_inverted_index":{"While":[0],"the":[1,30,54,92,137],"field":[2],"of":[3],"natural":[4,14],"language":[5,15],"to":[6,82,95,140],"SQL(NL2SQL)":[7],"has":[8],"made":[9],"significant":[10],"advancements":[11],"in":[12],"translating":[13],"instructions":[16],"into":[17,99],"executable":[18,100],"SQL":[19],"scripts":[20,101],"for":[21,102,123],"data":[22,32,35,55],"querying":[23],"and":[24,39,67,106,116,147],"processing,":[25],"achieving":[26],"full":[27],"automation":[28],"within":[29],"broader":[31],"science":[33,56],"pipeline\u2013encompassing":[34],"querying,":[36],"analysis,":[37,105],"visualization,":[38],"reporting\u2013remains":[40],"a":[41,74],"complex":[42],"challenge.":[43],"This":[44],"study":[45],"introduces":[46],"SageCopilot,":[47],"an":[48,79],"advanced,":[49],"industry-grade":[50],"system":[51],"that":[52],"automates":[53],"pipeline":[57],"by":[58],"integrating":[59],"Large":[60],"Language":[61,68],"Models":[62],"(LLMs),":[63],"Autonomous":[64],"Agents":[65],"(AutoAgents),":[66],"User":[69],"Interfaces":[70],"(LUIs).":[71],"Designed":[72],"with":[73,133],"two-phase":[75],"architecture,":[76],"SageCopilot":[77,126],"uses":[78],"offline":[80],"phase":[81,94],"generate":[83],"high-quality":[84],"demonstrations":[85],"supporting":[86],"In-Context":[87],"Learning":[88],"(ICL),":[89],"which":[90],"powers":[91],"online":[93],"transform":[96],"user":[97],"inputs":[98],"database":[103],"queries,":[104],"visualization":[107],"tasks.":[108],"Leveraging":[109],"specialized":[110],"components":[111],"such":[112],"as":[113,118,120],"NL2SQL,":[114],"Text2Analyze,":[115],"Text2Viz,":[117],"well":[119],"chain-of-thought":[121],"prompting":[122],"multi-turn":[124],"interactions,":[125],"achieves":[127],"superior":[128],"end-to-end":[129],"automation.":[130],"Rigorous":[131],"experimentation":[132],"real-world":[134],"datasets":[135],"demonstrates":[136],"system's":[138],"ability":[139],"minimize":[141],"human":[142],"intervention":[143],"while":[144],"ensuring":[145],"correctness":[146],"user-friendly":[148],"operation.":[149]},"counts_by_year":[],"updated_date":"2026-02-09T05:59:30.833894","created_date":"2025-11-23T00:00:00"}
