{"id":"https://openalex.org/W4406458164","doi":"https://doi.org/10.1109/bigdata62323.2024.10825736","title":"INTEGRATE-KG: A Workflow For Unifying Heterogeneous Data Driven by Shared Languages","display_name":"INTEGRATE-KG: A Workflow For Unifying Heterogeneous Data Driven by Shared Languages","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406458164","doi":"https://doi.org/10.1109/bigdata62323.2024.10825736"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060552352","display_name":"Nahed Abu Zaid","orcid":null},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Nahed Abu Zaid","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045531668","display_name":"Kara Schatz","orcid":"https://orcid.org/0000-0003-2310-5131"},"institutions":[{"id":"https://openalex.org/I194120229","display_name":"Xavier University","ror":"https://ror.org/00f266q65","country_code":"US","type":"education","lineage":["https://openalex.org/I194120229"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kara Schatz","raw_affiliation_strings":["Xavier University,Cincinnati,Ohio,USA"],"affiliations":[{"raw_affiliation_string":"Xavier University,Cincinnati,Ohio,USA","institution_ids":["https://openalex.org/I194120229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006129934","display_name":"Kimberly Bourne","orcid":null},"institutions":[{"id":"https://openalex.org/I430192","display_name":"Appalachian State University","ror":"https://ror.org/051m4vc48","country_code":"US","type":"education","lineage":["https://openalex.org/I430192"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kimberly Bourne","raw_affiliation_strings":["Appalachian State University,Boone,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"Appalachian State University,Boone,North Carolina,USA","institution_ids":["https://openalex.org/I430192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008494701","display_name":"Darrell Harry","orcid":null},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Darrell Harry","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067181746","display_name":"Christine Ogilvie Hendren","orcid":"https://orcid.org/0000-0002-9546-6545"},"institutions":[{"id":"https://openalex.org/I430192","display_name":"Appalachian State University","ror":"https://ror.org/051m4vc48","country_code":"US","type":"education","lineage":["https://openalex.org/I430192"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christine Hendren","raw_affiliation_strings":["Appalachian State University,Boone,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"Appalachian State University,Boone,North Carolina,USA","institution_ids":["https://openalex.org/I430192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072312029","display_name":"Anna\u2010Maria Marshall","orcid":"https://orcid.org/0000-0002-0458-7203"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anna-Maria Marshall","raw_affiliation_strings":["University of Illinois Urbana-Champaign,Urbana,Illinois,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,Urbana,Illinois,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062810411","display_name":"Khara Grieger","orcid":"https://orcid.org/0000-0002-0821-0534"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Khara Grieger","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003785721","display_name":"Jacob L. Jones","orcid":"https://orcid.org/0000-0002-9182-0957"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jacob Jones","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069527267","display_name":"Alexey V. Gulyuk","orcid":"https://orcid.org/0000-0002-9924-8713"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexey V. Gulyuk","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046770281","display_name":"Yaroslava G. Yingling","orcid":"https://orcid.org/0000-0002-8557-9992"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yaroslava G. Yingling","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078910758","display_name":"Rada Chirkova","orcid":"https://orcid.org/0000-0003-4249-9690"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rada Chirkova","raw_affiliation_strings":["North Carolina State University,Raleigh,North Carolina,USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University,Raleigh,North Carolina,USA","institution_ids":["https://openalex.org/I137902535"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5060552352"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":1.0924,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.82936318,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3522","last_page":"3531"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7864522933959961},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7617360353469849},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.51433265209198},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4707012176513672},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.4531573951244354},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3379678726196289},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.249001145362854}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7864522933959961},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7617360353469849},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.51433265209198},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4707012176513672},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4531573951244354},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3379678726196289},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.249001145362854}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825736","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W8870360","https://openalex.org/W2144211451","https://openalex.org/W2242464395","https://openalex.org/W2342249984","https://openalex.org/W2852434548","https://openalex.org/W2896457183","https://openalex.org/W2903963001","https://openalex.org/W2918428907","https://openalex.org/W2970861952","https://openalex.org/W2972167903","https://openalex.org/W2979826702","https://openalex.org/W3010336026","https://openalex.org/W3022290554","https://openalex.org/W3093789214","https://openalex.org/W4308206224","https://openalex.org/W4308335753","https://openalex.org/W4378376239","https://openalex.org/W4382599418","https://openalex.org/W4391093129","https://openalex.org/W4399783095","https://openalex.org/W4401009895","https://openalex.org/W4401807469","https://openalex.org/W6600367688","https://openalex.org/W6636510571","https://openalex.org/W6675354045","https://openalex.org/W6755207826","https://openalex.org/W6767463829","https://openalex.org/W6767905578","https://openalex.org/W7002254874"],"related_works":["https://openalex.org/W1981780420","https://openalex.org/W2182707996","https://openalex.org/W45233828","https://openalex.org/W2964988449","https://openalex.org/W2397952901","https://openalex.org/W2029380707","https://openalex.org/W188202134","https://openalex.org/W4255934811","https://openalex.org/W2465382974","https://openalex.org/W2010229520"],"abstract_inverted_index":{"In":[0],"large-scale":[1],"multidisciplinary":[2],"consortia":[3,27,57],"endeavors":[4],"that":[5,102,129],"address":[6,119],"problems":[7],"of":[8,45,64,71,93,99,110,141,146,153],"research,":[9],"industry,":[10],"and":[11,77,199,215,221],"public-good":[12],"significance,":[13],"it":[14,211],"is":[15,89,130,149],"typically":[16],"a":[17,30,38,124,181],"priority":[18],"to":[19,61,75,115,161,195,212],"integrate":[20],"the":[21,26,42,46,62,69,91,108,111,120,139,147,154,158,167,186,203],"heterogeneous":[22],"data":[23,32,43,48,101,169,217],"contributed":[24],"by":[25],"participants":[28,74],"into":[29,96],"unified":[31,97],"representation.":[33],"Knowledge":[34],"graphs":[35],"(KGs)":[36],"are":[37],"typical":[39],"choice":[40],"for":[41,138,157,176,183,192,224],"model":[44],"resulting":[47],"repositories.":[49],"To":[50],"overcome":[51],"potential":[52],"issues":[53],"with":[54,68,107,190,209],"terminology":[55,117,164],"misalignment,":[56],"commonly":[58],"dedicate":[59],"resources":[60],"development":[63],"shared":[65,113,159,188],"languages":[66,114,160],"(vocabularies),":[67],"intent":[70],"enabling":[72],"diverse":[73,100],"understand":[76],"build":[78],"on":[79,90,206,218],"each":[80],"other\u2019s":[81],"work.":[82],"Our":[83],"research":[84],"focus":[85],"in":[86,150,228],"this":[87],"paper":[88],"challenge":[92],"automating":[94],"integration":[95],"KGs":[98],"potentially":[103],"use":[104,152],"different":[105],"terminology,":[106],"help":[109],"available":[112,156,187],"resolve":[116],"clashes.To":[118],"challenge,":[121],"we":[122],"introduce":[123],"data-integration":[125],"workflow":[126],"called":[127],"INTEGRATE-KG":[128,178,229],"domain":[131,134,193,226],"agnostic,":[132],"yet":[133],"aware":[135],"through":[136],"opportunities":[137,191],"involvement":[140],"humans-in-the-loop.":[142,231],"A":[143],"key":[144],"feature":[145],"approach":[148],"its":[151],"synonyms":[155],"automate":[162],"semantics-level":[163],"alignment":[165],"across":[166],"individual":[168],"contributions":[170],"after":[171],"they":[172],"have":[173],"been":[174],"submitted":[175],"integration.":[177],"also":[179],"includes":[180],"module":[182],"automatically":[184],"enriching":[185],"languages,":[189],"experts":[194,227],"provide":[196,222],"semantic":[197],"corrections":[198],"feedback.":[200],"We":[201],"present":[202],"workflow,":[204],"report":[205],"our":[207],"experiences":[208],"applying":[210],"experimental,":[213],"survey,":[214],"shared-language":[216],"phosphorus":[219],"sustainability,":[220],"suggestions":[223],"involving":[225],"as":[230]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
