{"id":"https://openalex.org/W7125829827","doi":"https://doi.org/10.48550/arxiv.2601.17546","title":"Push Down Optimization for Distributed Multi Cloud Data Integration","display_name":"Push Down Optimization for Distributed Multi Cloud Data Integration","publication_year":2026,"publication_date":"2026-01-24","ids":{"openalex":"https://openalex.org/W7125829827","doi":"https://doi.org/10.48550/arxiv.2601.17546"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.17546","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.17546","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.17546","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124009035","display_name":"Ravi Kiran Kodali","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kodali, Ravi Kiran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123903383","display_name":"Vinoth Punniyamoorthy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Punniyamoorthy, Vinoth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123886576","display_name":"Akash Kumar Agarwal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Agarwal, Akash Kumar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123998514","display_name":"Bikesh Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Bikesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123930790","display_name":"Balakrishna Pothineni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pothineni, Balakrishna","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124050744","display_name":"Aswathnarayan Muthukrishnan Kirubakaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kirubakaran, Aswathnarayan Muthukrishnan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123948034","display_name":"Sumit Saha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saha, Sumit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123946414","display_name":"Nachiappan Chockalingam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chockalingam, Nachiappan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5124009035"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.8636999726295471,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.8636999726295471,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.03060000017285347,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11614","display_name":"Cloud Data Security Solutions","score":0.013799999840557575,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.850600004196167},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6108999848365784},{"id":"https://openalex.org/keywords/data-migration","display_name":"Data migration","score":0.45829999446868896},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.4300000071525574},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.42329999804496765},{"id":"https://openalex.org/keywords/cloud-database","display_name":"Cloud database","score":0.42239999771118164},{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.41359999775886536},{"id":"https://openalex.org/keywords/data-transmission","display_name":"Data transmission","score":0.4041000008583069},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.39340001344680786},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.3885999917984009}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.850600004196167},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7498999834060669},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6108999848365784},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.531499981880188},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5087000131607056},{"id":"https://openalex.org/C146152329","wikidata":"https://www.wikidata.org/wiki/Q1932543","display_name":"Data migration","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.4300000071525574},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C2778974508","wikidata":"https://www.wikidata.org/wiki/Q2499178","display_name":"Cloud database","level":3,"score":0.42239999771118164},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.41359999775886536},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.4041000008583069},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.39340001344680786},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3885999917984009},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.37130001187324524},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.3605000078678131},{"id":"https://openalex.org/C65813073","wikidata":"https://www.wikidata.org/wiki/Q1622420","display_name":"High availability","level":2,"score":0.35190001130104065},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.34689998626708984},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.33739998936653137},{"id":"https://openalex.org/C2779599972","wikidata":"https://www.wikidata.org/wiki/Q82231","display_name":"NoSQL","level":3,"score":0.335099995136261},{"id":"https://openalex.org/C32587265","wikidata":"https://www.wikidata.org/wiki/Q1182260","display_name":"Data deduplication","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C120115606","wikidata":"https://www.wikidata.org/wiki/Q5135723","display_name":"Cloud testing","level":4,"score":0.30219998955726624},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.29499998688697815},{"id":"https://openalex.org/C2778505942","wikidata":"https://www.wikidata.org/wiki/Q18344624","display_name":"Microservices","level":3,"score":0.289900004863739},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2775000035762787},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C199168358","wikidata":"https://www.wikidata.org/wiki/Q3367000","display_name":"Orchestration","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C69016650","wikidata":"https://www.wikidata.org/wiki/Q1364211","display_name":"Multitenancy","level":5,"score":0.26339998841285706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.17546","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.17546","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.17546","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.17546","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.6005523800849915,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Enterprises":[0],"increasingly":[1],"adopt":[2,150],"multi":[3,90],"cloud":[4,56,91,114,159],"architectures":[5],"to":[6,68,132,151],"take":[7],"advantage":[8],"of":[9,85],"diverse":[10],"database":[11,42],"engines,":[12,73],"regional":[13],"availability,":[14],"and":[15,31,76,94,98,107,124,138,155],"cost":[16,140],"models.":[17],"In":[18],"these":[19],"environments,":[20],"ETL":[21,48,92,153],"pipelines":[22,93],"must":[23],"process":[24],"large,":[25],"distributed":[26,158],"datasets":[27],"while":[28,116],"minimizing":[29],"latency":[30],"transfer":[32,136],"cost.":[33],"Push":[34],"down":[35,87],"optimization,":[36],"which":[37],"executes":[38],"transformation":[39],"logic":[40],"within":[41,46],"engines":[43],"rather":[44],"than":[45],"the":[47,83],"tool,":[49],"has":[50],"proven":[51],"highly":[52],"effective":[53],"in":[54,89,157],"single":[55],"systems.":[57],"However,":[58],"when":[59],"applied":[60],"across":[61,122],"multiple":[62],"clouds,":[63],"it":[64],"faces":[65],"challenges":[66],"related":[67],"data":[69,108],"movement,":[70],"heterogeneous":[71],"SQL":[72],"orchestration":[74],"complexity,":[75],"fragmented":[77],"security":[78],"controls.":[79],"This":[80],"paper":[81],"examines":[82],"feasibility":[84],"push":[86,103],"optimization":[88],"analyzes":[95],"its":[96],"benefits":[97],"limitations.":[99],"It":[100],"evaluates":[101],"localized":[102],"down,":[104],"hybrid":[105],"models,":[106],"federation":[109],"techniques":[110],"that":[111,147],"reduce":[112],"cross":[113],"traffic":[115],"improving":[117],"performance.":[118],"A":[119],"case":[120],"study":[121,143],"Redshift":[123],"BigQuery":[125],"demonstrates":[126],"measurable":[127],"gains,":[128],"including":[129],"lower":[130],"end":[131,133],"runtime,":[134],"reduced":[135],"volume,":[137],"improved":[139],"efficiency.":[141],"The":[142],"highlights":[144],"practical":[145],"strategies":[146],"organizations":[148],"can":[149],"improve":[152],"scalability":[154],"reliability":[156],"environments.":[160]},"counts_by_year":[],"updated_date":"2026-01-28T23:18:48.515280","created_date":"2026-01-28T00:00:00"}
