{"id":"https://openalex.org/W2969607675","doi":"https://doi.org/10.3390/info12080316","title":"Populating Web-Scale Knowledge Graphs Using Distantly Supervised Relation Extraction and Validation","display_name":"Populating Web-Scale Knowledge Graphs Using Distantly Supervised Relation Extraction and Validation","publication_year":2021,"publication_date":"2021-08-06","ids":{"openalex":"https://openalex.org/W2969607675","doi":"https://doi.org/10.3390/info12080316","mag":"2969607675"},"language":"en","primary_location":{"id":"doi:10.3390/info12080316","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info12080316","pdf_url":"https://www.mdpi.com/2078-2489/12/8/316/pdf?version=1628248438","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2078-2489/12/8/316/pdf?version=1628248438","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101686334","display_name":"Sarthak Dash","orcid":"https://orcid.org/0000-0001-8765-4055"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sarthak Dash","raw_affiliation_strings":["IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079135719","display_name":"Michael Gla\u00df","orcid":"https://orcid.org/0000-0002-8006-8843"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael R. Glass","raw_affiliation_strings":["IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087419620","display_name":"Alfio Gliozzo","orcid":"https://orcid.org/0000-0002-8044-2911"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alfio Gliozzo","raw_affiliation_strings":["IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043925652","display_name":"Mustafa Canim","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mustafa Canim","raw_affiliation_strings":["IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","IBM"],"affiliations":[{"raw_affiliation_string":"IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"IBM","institution_ids":[]}]},{"author_position":"last","author":{"id":null,"display_name":"Gaetano Rossiello","orcid":"https://orcid.org/0000-0003-1042-4782"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gaetano Rossiello","raw_affiliation_strings":["IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI, IBM Thomas J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I4210114115"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101686334"],"corresponding_institution_ids":["https://openalex.org/I4210114115"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00365387,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":"8","first_page":"316","last_page":"316"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8028451204299927},{"id":"https://openalex.org/keywords/relationship-extraction","display_name":"Relationship extraction","score":0.6766828894615173},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6629610061645508},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.645642876625061},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6346890330314636},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6340546607971191},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.6144310235977173},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5929287672042847},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.584307074546814},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.5112171173095703},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.4987666606903076},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.48758429288864136},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.4724602699279785},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.44339683651924133},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4191231429576874},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.41620540618896484},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3416483700275421},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33743077516555786},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.28897374868392944},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.08957827091217041}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8028451204299927},{"id":"https://openalex.org/C153604712","wikidata":"https://www.wikidata.org/wiki/Q7310755","display_name":"Relationship extraction","level":3,"score":0.6766828894615173},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6629610061645508},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.645642876625061},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6346890330314636},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6340546607971191},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.6144310235977173},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5929287672042847},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.584307074546814},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.5112171173095703},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.4987666606903076},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.48758429288864136},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.4724602699279785},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.44339683651924133},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4191231429576874},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.41620540618896484},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3416483700275421},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33743077516555786},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.28897374868392944},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.08957827091217041},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.3390/info12080316","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info12080316","pdf_url":"https://www.mdpi.com/2078-2489/12/8/316/pdf?version=1628248438","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1908.08104","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.08104","pdf_url":"https://arxiv.org/pdf/1908.08104","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2969607675","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1908.08104","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:doaj.org/article:7bdd82f8c8b746c1a3965e3af319567e","is_oa":true,"landing_page_url":"https://doaj.org/article/7bdd82f8c8b746c1a3965e3af319567e","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Information, Vol 12, Iss 8, p 316 (2021)","raw_type":"article"},{"id":"doi:10.48550/arxiv.1908.08104","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1908.08104","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/info12080316","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info12080316","pdf_url":"https://www.mdpi.com/2078-2489/12/8/316/pdf?version=1628248438","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4099999964237213}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2969607675.pdf","grobid_xml":"https://content.openalex.org/works/W2969607675.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W102708294","https://openalex.org/W174427690","https://openalex.org/W205829674","https://openalex.org/W790941020","https://openalex.org/W1512387364","https://openalex.org/W1514027499","https://openalex.org/W1604644367","https://openalex.org/W1653383105","https://openalex.org/W1750263989","https://openalex.org/W1852412531","https://openalex.org/W1942169943","https://openalex.org/W1977970897","https://openalex.org/W2120663660","https://openalex.org/W2127426251","https://openalex.org/W2127795553","https://openalex.org/W2132679783","https://openalex.org/W2138204945","https://openalex.org/W2145544171","https://openalex.org/W2250521169","https://openalex.org/W2251135946","https://openalex.org/W2515462165","https://openalex.org/W2526662185","https://openalex.org/W2556343638","https://openalex.org/W2728059831","https://openalex.org/W2768762802","https://openalex.org/W2774837955","https://openalex.org/W2805381747","https://openalex.org/W2889832871","https://openalex.org/W2949972983","https://openalex.org/W2963454301","https://openalex.org/W2963485453","https://openalex.org/W2963503534","https://openalex.org/W2964217331","https://openalex.org/W6604189946","https://openalex.org/W6630579473","https://openalex.org/W6640747935","https://openalex.org/W6678830454"],"related_works":["https://openalex.org/W3191697963","https://openalex.org/W2788902803","https://openalex.org/W2752124967","https://openalex.org/W2796418006","https://openalex.org/W2510749011","https://openalex.org/W1763375142","https://openalex.org/W2742267824","https://openalex.org/W2767373106","https://openalex.org/W3166972201","https://openalex.org/W2251205667","https://openalex.org/W2272061611","https://openalex.org/W2117763124","https://openalex.org/W3169827118","https://openalex.org/W2944977718","https://openalex.org/W3168921237","https://openalex.org/W2982332369","https://openalex.org/W2982807168","https://openalex.org/W3125024313","https://openalex.org/W2134928896","https://openalex.org/W2165863615"],"abstract_inverted_index":{"In":[0,38],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,23,34,43,103,119,136,166],"fully":[6],"automated":[7],"system":[8,21,41,73,111,151],"to":[9,61,81,133,140],"extend":[10,141],"knowledge":[11,48,144],"graphs":[12],"using":[13],"external":[14],"information":[15,56],"from":[16,145],"web-scale":[17,137],"corpora.":[18],"The":[19,71],"designed":[20,72],"leverages":[22],"deep-learning-based":[24],"technology":[25],"for":[26,47,79],"relation":[27,116],"extraction":[28,117],"that":[29,108,149],"can":[30],"be":[31],"trained":[32],"by":[33,51,118],"distantly":[35],"supervised":[36],"approach.":[37],"addition,":[39],"the":[40,53,58,64,67,109,113],"uses":[42],"deep":[44],"learning":[45],"approach":[46],"base":[49],"completion":[50],"utilizing":[52],"global":[54],"structure":[55],"of":[57,66,115,125,131],"induced":[59],"KG":[60],"further":[62],"refine":[63],"confidence":[65],"newly":[68],"discovered":[69],"relations.":[70],"does":[74,88,158],"not":[75,89,153,159],"require":[76,160],"any":[77,91,161],"effort":[78],"adaptation":[80,162],"new":[82],"languages":[83],"and":[84,96],"domains":[85],"as":[86],"it":[87],"use":[90],"hand-labeled":[92],"data,":[93],"NLP":[94],"analytics,":[95],"inference":[97],"rules.":[98],"Our":[99],"experiments,":[100],"performed":[101],"on":[102],"popular":[104],"academic":[105],"benchmark,":[106],"demonstrate":[107],"suggested":[110],"boosts":[112],"performance":[114],"wide":[120],"margin,":[121],"reporting":[122],"error":[123],"reductions":[124],"50%,":[126],"resulting":[127],"in":[128],"relative":[129],"improvement":[130],"up":[132],"100%.":[134],"Furthermore,":[135],"experiment":[138],"conducted":[139],"DBPedia":[142],"with":[143],"Common":[146],"Crawl":[147],"shows":[148],"our":[150],"is":[152],"only":[154],"scalable":[155],"but":[156],"also":[157],"cost,":[163],"while":[164],"yielding":[165],"substantial":[167],"accuracy":[168],"gain.":[169]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
