{"id":"https://openalex.org/W7134111356","doi":"https://doi.org/10.1109/bigdata66926.2025.11402159","title":"An Agentic Data System for Analyzing Heterogeneous Data","display_name":"An Agentic Data System for Analyzing Heterogeneous Data","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W7134111356","doi":"https://doi.org/10.1109/bigdata66926.2025.11402159"},"language":null,"primary_location":{"id":"doi:10.1109/bigdata66926.2025.11402159","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata66926.2025.11402159","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Guoliang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guoliang Li","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.87292939,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.04270000010728836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.04270000010728836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.03519999980926514,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14082","display_name":"Modeling, Simulation, and Optimization","score":0.033399999141693115,"subfield":{"id":"https://openalex.org/subfields/2607","display_name":"Discrete Mathematics and Combinatorics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-system","display_name":"Data system","score":0.3068999946117401},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.29660001397132874},{"id":"https://openalex.org/keywords/information-system","display_name":"Information system","score":0.27160000801086426},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.26910001039505005},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.2612000107765198},{"id":"https://openalex.org/keywords/data-analysis","display_name":"Data analysis","score":0.25760000944137573}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6086000204086304},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3522999882698059},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3269999921321869},{"id":"https://openalex.org/C203481301","wikidata":"https://www.wikidata.org/wiki/Q76221","display_name":"Data system","level":2,"score":0.3068999946117401},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C180198813","wikidata":"https://www.wikidata.org/wiki/Q121182","display_name":"Information system","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C175801342","wikidata":"https://www.wikidata.org/wiki/Q1988917","display_name":"Data analysis","level":2,"score":0.25760000944137573},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata66926.2025.11402159","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata66926.2025.11402159","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.4201991856098175,"display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Current":[0],"systems":[1],"for":[2,97],"analyzing":[3,48],"unstructured":[4,50],"data":[5,34,53,86],"often":[6],"depend":[7],"heavily":[8],"on":[9,152],"experts":[10],"to":[11,18,40,89,107,120],"code":[12],"and":[13,21,51,74,102,111,123,134,148],"manage":[14,108],"complex":[15],"workflows,":[16],"leading":[17],"high":[19],"costs":[20],"significant":[22],"time":[23],"consumption.":[24],"To":[25],"address":[26],"these":[27],"challenges,":[28],"we":[29,115],"introduce":[30,116],"AgenticData,":[31],"an":[32],"agentic":[33],"analytics":[35],"system":[36],"that":[37,64,83,139],"allows":[38],"users":[39],"submit":[41],"natural":[42],"language":[43],"(NL)":[44],"queries":[45,68],"while":[46],"autonomously":[47],"both":[49],"structured":[52],"across":[54],"various":[55],"domains.":[56],"AgenticData":[57,130,140],"starts":[58],"with":[59],"a":[60,79,85,93,103],"feedback-driven":[61],"planning":[62],"approach":[63],"automatically":[65],"converts":[66],"NL":[67],"into":[69],"semantic":[70,75,94,117,125],"plans":[71],"containing":[72],"relational":[73],"operators.":[76],"We":[77,127],"propose":[78],"multi-agent":[80],"collaboration":[81],"strategy":[82],"includes":[84],"profiling":[87],"agent":[88,96,106],"identify":[90],"relevant":[91],"data,":[92],"cross-validation":[95],"iterative":[98],"optimization":[99,118],"using":[100,131],"feedback,":[101],"smart":[104],"memory":[105],"short-term":[109],"context":[110],"long-term":[112],"knowledge.":[113],"Additionally,":[114],"techniques":[119],"efficiently":[121],"refine":[122],"execute":[124],"plans.":[126],"have":[128],"evaluated":[129],"five":[132],"benchmarks,":[133],"the":[135],"experimental":[136],"results":[137],"showed":[138],"delivers":[141],"superior":[142],"accuracy,":[143],"significantly":[144],"outperforming":[145],"state-of-the-art":[146],"methods":[147],"achieving":[149],"top":[150],"positions":[151],"two":[153],"well-known":[154],"leaderboards.":[155]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-03-08T00:00:00"}
