{"id":"https://openalex.org/W2889003264","doi":"https://doi.org/10.14778/3229863.3240491","title":"Open data integration","display_name":"Open data integration","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2889003264","doi":"https://doi.org/10.14778/3229863.3240491","mag":"2889003264"},"language":"en","primary_location":{"id":"doi:10.14778/3229863.3240491","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3229863.3240491","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022619313","display_name":"Ren\u00e9e J. Miller","orcid":"https://orcid.org/0000-0002-1484-4787"},"institutions":[{"id":"https://openalex.org/I87182695","display_name":"Universidad del Noreste","ror":"https://ror.org/02ahky613","country_code":"MX","type":"education","lineage":["https://openalex.org/I87182695"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Ren\u00e9e J. Miller","raw_affiliation_strings":["Northeastern University"],"affiliations":[{"raw_affiliation_string":"Northeastern University","institution_ids":["https://openalex.org/I87182695"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5022619313"],"corresponding_institution_ids":["https://openalex.org/I87182695"],"apc_list":null,"apc_paid":null,"fwci":8.0463,"has_fulltext":false,"cited_by_count":84,"citation_normalized_percentile":{"value":0.97664971,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"11","issue":"12","first_page":"2130","last_page":"2139"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.813219428062439},{"id":"https://openalex.org/keywords/open-data","display_name":"Open data","score":0.6210149526596069},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.6103595495223999},{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.5978695154190063},{"id":"https://openalex.org/keywords/data-virtualization","display_name":"Data virtualization","score":0.504231333732605},{"id":"https://openalex.org/keywords/linked-data","display_name":"Linked data","score":0.4929206371307373},{"id":"https://openalex.org/keywords/data-warehouse","display_name":"Data warehouse","score":0.48070818185806274},{"id":"https://openalex.org/keywords/data-discovery","display_name":"Data discovery","score":0.4358759820461273},{"id":"https://openalex.org/keywords/semi-structured-data","display_name":"Semi-structured data","score":0.42646878957748413},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.42367759346961975},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.40781354904174805},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.35119330883026123},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.3330836296081543},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.29655301570892334},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.21604010462760925},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.18185144662857056},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.1531527042388916}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.813219428062439},{"id":"https://openalex.org/C2780535194","wikidata":"https://www.wikidata.org/wiki/Q309901","display_name":"Open data","level":2,"score":0.6210149526596069},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6103595495223999},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.5978695154190063},{"id":"https://openalex.org/C80344994","wikidata":"https://www.wikidata.org/wiki/Q5227369","display_name":"Data virtualization","level":4,"score":0.504231333732605},{"id":"https://openalex.org/C69075417","wikidata":"https://www.wikidata.org/wiki/Q515701","display_name":"Linked data","level":3,"score":0.4929206371307373},{"id":"https://openalex.org/C135572916","wikidata":"https://www.wikidata.org/wiki/Q193351","display_name":"Data warehouse","level":2,"score":0.48070818185806274},{"id":"https://openalex.org/C2777516300","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data discovery","level":3,"score":0.4358759820461273},{"id":"https://openalex.org/C40077939","wikidata":"https://www.wikidata.org/wiki/Q2336004","display_name":"Semi-structured data","level":3,"score":0.42646878957748413},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.42367759346961975},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.40781354904174805},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.35119330883026123},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.3330836296081543},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29655301570892334},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.21604010462760925},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.18185144662857056},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.1531527042388916},{"id":"https://openalex.org/C513985346","wikidata":"https://www.wikidata.org/wiki/Q270471","display_name":"Virtualization","level":3,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3229863.3240491","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3229863.3240491","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17","score":0.5299999713897705}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":82,"referenced_works":["https://openalex.org/W1491409610","https://openalex.org/W1503955515","https://openalex.org/W1536525420","https://openalex.org/W1547612978","https://openalex.org/W1556076816","https://openalex.org/W1588213250","https://openalex.org/W1721994796","https://openalex.org/W1864010644","https://openalex.org/W1875032969","https://openalex.org/W1879587332","https://openalex.org/W1922832738","https://openalex.org/W1969621019","https://openalex.org/W1976957990","https://openalex.org/W1980302278","https://openalex.org/W1981578383","https://openalex.org/W1993783004","https://openalex.org/W1996505782","https://openalex.org/W2006149654","https://openalex.org/W2015191210","https://openalex.org/W2020022499","https://openalex.org/W2022166150","https://openalex.org/W2025151754","https://openalex.org/W2030072751","https://openalex.org/W2038276547","https://openalex.org/W2042389627","https://openalex.org/W2059268928","https://openalex.org/W2060805613","https://openalex.org/W2066806792","https://openalex.org/W2073329022","https://openalex.org/W2089634871","https://openalex.org/W2100365109","https://openalex.org/W2102729564","https://openalex.org/W2105436061","https://openalex.org/W2108223890","https://openalex.org/W2108489852","https://openalex.org/W2117200425","https://openalex.org/W2121269638","https://openalex.org/W2125149214","https://openalex.org/W2128056631","https://openalex.org/W2130825214","https://openalex.org/W2134876510","https://openalex.org/W2139021951","https://openalex.org/W2140116426","https://openalex.org/W2143455443","https://openalex.org/W2147717514","https://openalex.org/W2148781362","https://openalex.org/W2161666572","https://openalex.org/W2162520370","https://openalex.org/W2167847032","https://openalex.org/W2189052568","https://openalex.org/W2216189112","https://openalex.org/W2224038009","https://openalex.org/W2249895122","https://openalex.org/W2251018714","https://openalex.org/W2293253366","https://openalex.org/W2293618136","https://openalex.org/W2341748398","https://openalex.org/W2396588571","https://openalex.org/W2400256190","https://openalex.org/W2438792749","https://openalex.org/W2576439162","https://openalex.org/W2585438896","https://openalex.org/W2610492020","https://openalex.org/W2616147950","https://openalex.org/W2624356872","https://openalex.org/W2741470040","https://openalex.org/W2750620035","https://openalex.org/W2750991217","https://openalex.org/W2752618741","https://openalex.org/W2792572948","https://openalex.org/W2798664493","https://openalex.org/W2798901078","https://openalex.org/W2811097925","https://openalex.org/W2963174348","https://openalex.org/W2963626623","https://openalex.org/W3121289605","https://openalex.org/W6633446409","https://openalex.org/W6680052129","https://openalex.org/W6712839960","https://openalex.org/W6732417551","https://openalex.org/W6733170484","https://openalex.org/W6753098016"],"related_works":["https://openalex.org/W4285228649","https://openalex.org/W4253617153","https://openalex.org/W2535793348","https://openalex.org/W3123392925","https://openalex.org/W2293051076","https://openalex.org/W2229112513","https://openalex.org/W2582017389","https://openalex.org/W2926120048","https://openalex.org/W1887370195","https://openalex.org/W2070438616"],"abstract_inverted_index":{"Open":[0,17],"data":[1,25,34,38,51,67,76,81,104,125,144,155,172,183],"plays":[2],"a":[3,46,86,98,127,132,160],"major":[4],"role":[5],"in":[6,166],"supporting":[7],"both":[8],"governmental":[9],"and":[10,28,68,123,163,179],"organizational":[11],"transparency.":[12],"Many":[13],"organizations":[14],"are":[15,78],"adopting":[16],"Data":[18],"Principles":[19],"promising":[20],"to":[21,37,61,64,96,113,118],"make":[22,32],"their":[23],"open":[24,66],"complete,":[26],"primary,":[27],"timely.":[29],"These":[30],"properties":[31],"this":[33],"tremendously":[35],"valuable":[36],"scientists.":[39],"However,":[40],"scientists":[41],"generally":[42],"do":[43],"not":[44],"have":[45],"priori":[47],"knowledge":[48],"about":[49,137],"what":[50],"is":[52,83,95,112,142,152],"available":[53],"(its":[54],"schema":[55],"or":[56,74,170],"content).":[57],"Nevertheless,":[58],"they":[59,77],"want":[60],"be":[62],"able":[63],"use":[65],"integrate":[69],"it":[70],"with":[71],"other":[72],"public":[73],"private":[75],"studying.":[79],"Traditionally,":[80],"integration":[82,138],"done":[84],"using":[85],"framework":[87],"called":[88],"query":[89,99],"discovery":[90,150,173],"where":[91,139],"the":[92,115,140],"main":[93],"task":[94],"discover":[97],"(or":[100],"transformation)":[101],"that":[102,151,175],"translates":[103],"from":[105],"one":[106],"form":[107],"into":[108,126],"another.":[109],"The":[110],"goal":[111],"find":[114],"right":[116],"operators":[117],"join,":[119],"nest,":[120],"group,":[121],"link,":[122],"twist":[124],"desired":[128],"form.":[129],"We":[130,158],"introduce":[131],"new":[133],"paradigm":[134],"for":[135],"thinking":[136],"focus":[141],"on":[143],"discovery,":[145],"but":[146],"highly":[147],"efficient":[148],"internet-scale":[149],"driven":[153],"by":[154],"analysis":[156],"needs.":[157],"describe":[159],"research":[161],"agenda":[162],"recent":[164],"progress":[165],"developing":[167],"scalable":[168],"data-analysis":[169],"query-aware":[171],"algorithms":[174],"provide":[176],"high":[177],"recall":[178],"accuracy":[180],"over":[181],"massive":[182],"repositories.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":19},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
