{"id":"https://openalex.org/W7118015199","doi":"https://doi.org/10.48550/arxiv.2512.23737","title":"Governing Cloud Data Pipelines with Agentic AI","display_name":"Governing Cloud Data Pipelines with Agentic AI","publication_year":2025,"publication_date":"2025-12-24","ids":{"openalex":"https://openalex.org/W7118015199","doi":"https://doi.org/10.48550/arxiv.2512.23737"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.23737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.23737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.23737","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120706330","display_name":"Aswathnarayan Muthukrishnan Kirubakaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kirubakaran, Aswathnarayan Muthukrishnan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133771970","display_name":"Adithya Parthasarathy","orcid":"https://orcid.org/0009-0001-6839-9527"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parthasarathy, Adithya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026172990","display_name":"Nitin K. Saksena","orcid":"https://orcid.org/0000-0002-2431-9871"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saksena, Nitin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121270376","display_name":"Ram Sekhar Bodala","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bodala, Ram Sekhar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121273068","display_name":"Akshay Deshpande","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deshpande, Akshay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121265125","display_name":"Suhas Malempati","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Malempati, Suhas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121254325","display_name":"Shiva Kumar Reddy Carimireddy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carimireddy, Shiva","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121268928","display_name":"Abhirup Mazumder","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mazumder, Abhirup","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5120706330"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.5920000076293945,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.5920000076293945,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.07729999721050262,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.04780000075697899,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.7922999858856201},{"id":"https://openalex.org/keywords/data-governance","display_name":"Data governance","score":0.6132000088691711},{"id":"https://openalex.org/keywords/orchestration","display_name":"Orchestration","score":0.5350000262260437},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.4284000098705292},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.41600000858306885},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.3959999978542328},{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.3702999949455261}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.7922999858856201},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6564000248908997},{"id":"https://openalex.org/C196879817","wikidata":"https://www.wikidata.org/wiki/Q872685","display_name":"Data governance","level":4,"score":0.6132000088691711},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.5350000262260437},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.4284000098705292},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3959999978542328},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.38929998874664307},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3887999951839447},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.3702999949455261},{"id":"https://openalex.org/C39389867","wikidata":"https://www.wikidata.org/wiki/Q380767","display_name":"Corporate governance","level":2,"score":0.3418999910354614},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.3278000056743622},{"id":"https://openalex.org/C175801342","wikidata":"https://www.wikidata.org/wiki/Q1988917","display_name":"Data analysis","level":2,"score":0.32510000467300415},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.32089999318122864},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3075999915599823},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28290000557899475},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.28279998898506165},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.2750000059604645},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C2778505942","wikidata":"https://www.wikidata.org/wiki/Q18344624","display_name":"Microservices","level":3,"score":0.26489999890327454},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.2558000087738037}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.23737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.23737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.23737","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.23737","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cloud":[0,49,73,124,145],"data":[1,69,178,199],"pipelines":[2,24,200],"increasingly":[3],"operate":[4],"under":[5],"dynamic":[6],"workloads,":[7],"evolving":[8],"schemas,":[9],"cost":[10,87,160],"constraints,":[11],"and":[12,29,41,64,82,88,91,103,118,131,164,180,193],"strict":[13],"governance":[14,63,113],"requirements.":[15],"Despite":[16],"advances":[17],"in":[18,34,201],"cloud-native":[19],"orchestration":[20],"frameworks,":[21],"most":[22],"production":[23],"rely":[25],"on":[26],"static":[27,174],"configurations":[28],"reactive":[30],"operational":[31,94,159],"practices,":[32],"resulting":[33],"prolonged":[35],"recovery":[36,152],"times,":[37],"inefficient":[38],"resource":[39,99],"utilization,":[40],"high":[42],"manual":[43,166],"overhead.":[44],"This":[45],"paper":[46],"presents":[47],"Agentic":[48,72,123,144],"Data":[50,74,125,146],"Engineering,":[51],"a":[52],"policy-aware":[53],"control":[54,65,189],"architecture":[55],"that":[56,143,186],"integrates":[57],"bounded":[58],"AI":[59],"agents":[60,78],"into":[61],"the":[62],"plane":[66],"of":[67],"cloud":[68,198],"pipelines.":[70],"In":[71],"Engineering":[75,126,147],"platform,":[76],"specialized":[77],"analyze":[79],"pipeline":[80,151],"telemetry":[81],"metadata,":[83],"reason":[84],"over":[85,170],"declarative":[86],"compliance":[89],"policies,":[90],"propose":[92],"constrained":[93],"actions":[95,109],"such":[96],"as":[97],"adaptive":[98],"reconfiguration,":[100],"schema":[101],"reconciliation,":[102],"automated":[104],"failure":[105],"recovery.":[106],"All":[107],"agent":[108],"are":[110],"validated":[111],"against":[112],"policies":[114],"to":[115,156,173],"ensure":[116],"predictable":[117],"auditable":[119],"behavior.":[120],"We":[121],"evaluate":[122],"platform":[127,148],"using":[128],"representative":[129],"batch":[130],"streaming":[132],"analytics":[133],"workloads":[134],"constructed":[135],"from":[136],"public":[137],"enterprise-style":[138],"datasets.":[139],"Experimental":[140],"results":[141,184],"show":[142],"reduces":[149],"mean":[150],"time":[153],"by":[154,161,169],"up":[155],"45%,":[157],"lowers":[158],"approximately":[162],"25%,":[163],"decreases":[165],"intervention":[167],"events":[168],"70%":[171],"compared":[172],"orchestration,":[175],"while":[176],"maintaining":[177],"freshness":[179],"policy":[181],"compliance.":[182],"These":[183],"demonstrate":[185],"policy-bounded":[187],"agentic":[188],"provides":[190],"an":[191],"effective":[192],"practical":[194],"approach":[195],"for":[196],"governing":[197],"enterprise":[202],"environments.":[203]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-01-02T00:00:00"}
