{"id":"https://openalex.org/W7154700396","doi":"https://doi.org/10.48550/arxiv.2604.15233","title":"Blue Data Intelligence Layer: Streaming Data and Agents for Multi-source Multi-modal Data-Centric Applications","display_name":"Blue Data Intelligence Layer: Streaming Data and Agents for Multi-source Multi-modal Data-Centric Applications","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7154700396","doi":"https://doi.org/10.48550/arxiv.2604.15233"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.15233","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15233","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.15233","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072105892","display_name":"Moin Aminnaseri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aminnaseri, Moin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075330839","display_name":"Farima Fatahi Bayat","orcid":"https://orcid.org/0000-0002-8738-411X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bayat, Farima Fatahi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040092252","display_name":"Nikita Bhutani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhutani, Nikita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093471806","display_name":"Jean-Flavien Bussotti","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bussotti, Jean-Flavien","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108420274","display_name":"Kevin Chan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chan, Kevin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065434429","display_name":"Rafael Li Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Rafael Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045853966","display_name":"Yanlin Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Yanlin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133885285","display_name":"Jackson Hassell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hassell, Jackson","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133850662","display_name":"Estevam Hruschka","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hruschka, Estevam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012111319","display_name":"Eser Kandogan","orcid":"https://orcid.org/0009-0004-3509-5502"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kandogan, Eser","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133917575","display_name":"Hannah Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Hannah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044396459","display_name":"James Levine","orcid":"https://orcid.org/0000-0002-5441-0860"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levine, James","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133849508","display_name":"Seiji Maekawa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maekawa, Seiji","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111769572","display_name":"Jalal Mahmud","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mahmud, Jalal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133861623","display_name":"Kushan Mitra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mitra, Kushan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133853391","display_name":"Naoki Otani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Otani, Naoki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022655234","display_name":"Pouya Pezeshkpour","orcid":"https://orcid.org/0009-0002-7055-0035"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pezeshkpour, Pouya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032735930","display_name":"Nima Shahbazi","orcid":"https://orcid.org/0000-0001-7016-3807"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shahbazi, Nima","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133889672","display_name":"Chen Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133889074","display_name":"Dan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":20,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.3840999901294708,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.3840999901294708,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.22859999537467957,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.051899999380111694,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.5479000210762024},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.5383999943733215},{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.4717999994754791},{"id":"https://openalex.org/keywords/xquery","display_name":"XQuery","score":0.4674000144004822},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.43849998712539673},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.42399999499320984},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.4074999988079071},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4009000062942505},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.400299996137619},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.39820000529289246}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8544999957084656},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.5479000210762024},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.5383999943733215},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.4717999994754791},{"id":"https://openalex.org/C2780512708","wikidata":"https://www.wikidata.org/wiki/Q850661","display_name":"XQuery","level":4,"score":0.4674000144004822},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.43849998712539673},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4350999891757965},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.42399999499320984},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.4074999988079071},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4009000062942505},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.400299996137619},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.3610000014305115},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.35519999265670776},{"id":"https://openalex.org/C153048206","wikidata":"https://www.wikidata.org/wiki/Q3454922","display_name":"Metadata repository","level":3,"score":0.34310001134872437},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3361000120639801},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.33320000767707825},{"id":"https://openalex.org/C19443361","wikidata":"https://www.wikidata.org/wiki/Q5282533","display_name":"Disparate system","level":2,"score":0.3215999901294708},{"id":"https://openalex.org/C136227091","wikidata":"https://www.wikidata.org/wiki/Q5380376","display_name":"Enterprise data management","level":3,"score":0.314300000667572},{"id":"https://openalex.org/C33326189","wikidata":"https://www.wikidata.org/wiki/Q17092450","display_name":"Information integration","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C30542707","wikidata":"https://www.wikidata.org/wiki/Q1603203","display_name":"Commonsense knowledge","level":3,"score":0.28299999237060547},{"id":"https://openalex.org/C100463513","wikidata":"https://www.wikidata.org/wiki/Q5227322","display_name":"Data model (GIS)","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.2782000005245209},{"id":"https://openalex.org/C20277647","wikidata":"https://www.wikidata.org/wiki/Q5227234","display_name":"Data access layer","level":3,"score":0.27619999647140503},{"id":"https://openalex.org/C164768185","wikidata":"https://www.wikidata.org/wiki/Q2919941","display_name":"Enterprise information integration","level":5,"score":0.27549999952316284},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.2752000093460083},{"id":"https://openalex.org/C171018156","wikidata":"https://www.wikidata.org/wiki/Q7370306","display_name":"Rotation formalisms in three dimensions","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C69075417","wikidata":"https://www.wikidata.org/wiki/Q515701","display_name":"Linked data","level":3,"score":0.25929999351501465},{"id":"https://openalex.org/C174252522","wikidata":"https://www.wikidata.org/wiki/Q3816772","display_name":"Natural language user interface","level":3,"score":0.25279998779296875},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.2526000142097473},{"id":"https://openalex.org/C137314826","wikidata":"https://www.wikidata.org/wiki/Q2330408","display_name":"Data mapping","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C2778180026","wikidata":"https://www.wikidata.org/wiki/Q18378163","display_name":"Semantic heterogeneity","level":4,"score":0.25209999084472656},{"id":"https://openalex.org/C147497476","wikidata":"https://www.wikidata.org/wiki/Q54872","display_name":"RDF","level":3,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.15233","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15233","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.15233","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.15233","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"NL2SQL":[0],"systems":[1,261],"aim":[2],"to":[3,19,79,111,156,183,192,233],"address":[4],"the":[5,38,103,113,139,167,170],"growing":[6],"need":[7],"for":[8,97,107,150],"natural":[9,161],"language":[10,162],"interaction":[11],"with":[12,176,209],"data.":[13,67],"However,":[14],"real-world":[15],"information":[16,121],"rarely":[17],"maps":[18],"a":[20,42,88,144],"single":[21,43,265],"SQL":[22],"query":[23,179,198],"because":[24],"(1)":[25],"users":[26],"express":[27],"queries":[28,47,195,247],"iteratively":[29],"(2)":[30],"questions":[31],"often":[32],"span":[33],"multiple":[34,213],"data":[35,58,96,104,109,145,152,185,190],"sources":[36,153],"beyond":[37,264],"closed-world":[39],"assumption":[40],"of":[41,141,219],"database,":[44],"and":[45,65,83,95,119,132,154,160,169,228,231,254],"(3)":[46],"frequently":[48],"rely":[49],"on":[50,189],"commonsense":[51],"or":[52],"external":[53],"knowledge.":[54],"Consequently,":[55],"satisfying":[56],"realistic":[57],"needs":[59],"require":[60],"integrating":[61],"heterogeneous":[62],"sources,":[63,227],"modalities,":[64],"contextual":[66],"In":[68],"this":[69],"paper,":[70],"we":[71],"present":[72],"Blue's":[73],"Data":[74],"Intelligence":[75],"Layer":[76],"(DIL)":[77],"designed":[78],"support":[80,217],"multi-source,":[81],"multi-modal,":[82],"data-centric":[84],"applications.":[85],"Blue":[86],"is":[87,143],"compound":[89,259],"AI":[90,260],"system":[91],"that":[92,147,205],"orchestrates":[93],"agents":[94],"enterprise":[98,125],"settings.":[99],"DIL":[100,142,164,187,215,239],"serves":[101],"as":[102,172],"intelligence":[105],"layer":[106],"agentic":[108],"processing,":[110],"bridge":[112],"semantic":[114],"gap":[115],"between":[116],"user":[117,194,246],"intent":[118],"available":[120],"by":[122],"unifying":[123],"structured":[124],"data,":[126],"world":[127],"knowledge":[128],"accessible":[129],"through":[130,136,240],"LLMs,":[131,166],"personal":[133],"context":[134],"obtained":[135],"interaction.":[137],"At":[138],"core":[140],"registry":[146],"stores":[148],"metadata":[149],"diverse":[151,226],"modalities":[155],"enable":[157],"both":[158],"native":[159],"queries.":[163],"treats":[165],"Web,":[168],"User":[171],"source":[173],"'databases',":[174],"each":[175],"their":[177],"own":[178],"interface,":[180],"elevating":[181],"them":[182],"first-class":[184],"sources.":[186],"relies":[188],"planners":[191,216],"transform":[193],"into":[196,222],"executable":[197],"plans.":[199],"These":[200],"plans":[201],"are":[202],"declarative":[203],"abstractions":[204],"unify":[206],"relational":[207],"operators":[208,211],"other":[210],"spanning":[212],"modalities.":[214],"decomposition":[218],"complex":[220],"requests":[221],"subqueries,":[223],"retrieval":[224],"from":[225],"finally":[229],"reasoning":[230],"integration":[232],"produce":[234],"final":[235],"results.":[236],"We":[237],"demonstrate":[238],"two":[241],"interactive":[242],"scenarios":[243],"in":[244],"which":[245],"dynamically":[248],"trigger":[249],"multi-source":[250],"retrieval,":[251],"cross-modal":[252],"reasoning,":[253],"result":[255],"synthesis,":[256],"illustrating":[257],"how":[258],"can":[262],"move":[263],"database":[266],"NL2SQL.":[267]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-18T00:00:00"}
