{"id":"https://openalex.org/W4393636323","doi":"https://doi.org/10.5281/zenodo.6523400","title":"Gollum: A Gold Standard for Large Scale\\\\Multi Source Knowledge Graph Matching","display_name":"Gollum: A Gold Standard for Large Scale\\\\Multi Source Knowledge Graph Matching","publication_year":2022,"publication_date":"2022-05-06","ids":{"openalex":"https://openalex.org/W4393636323","doi":"https://doi.org/10.5281/zenodo.6523400"},"language":"en","primary_location":{"id":"pmh:oai:zenodo.org:6523400","is_oa":true,"landing_page_url":"https://zenodo.org/record/6523400","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/6523400","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113159735","display_name":"Sven Herting","orcid":null},"institutions":[{"id":"https://openalex.org/I177802217","display_name":"University of Mannheim","ror":"https://ror.org/031bsb921","country_code":"DE","type":"education","lineage":["https://openalex.org/I177802217"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Herting, Sven","raw_affiliation_strings":["University of Mannheim"],"raw_orcid":"https://orcid.org/0000-0003-0333-5888","affiliations":[{"raw_affiliation_string":"University of Mannheim","institution_ids":["https://openalex.org/I177802217"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040542771","display_name":"Heiko Paulheim","orcid":null},"institutions":[{"id":"https://openalex.org/I177802217","display_name":"University of Mannheim","ror":"https://ror.org/031bsb921","country_code":"DE","type":"education","lineage":["https://openalex.org/I177802217"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Paulheim, Heiko","raw_affiliation_strings":["University of Mannheim"],"raw_orcid":"https://orcid.org/0000-0003-4386-8195","affiliations":[{"raw_affiliation_string":"University of Mannheim","institution_ids":["https://openalex.org/I177802217"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5113159735"],"corresponding_institution_ids":["https://openalex.org/I177802217"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6466042399406433},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5451074242591858},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.5067070126533508},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.47550636529922485},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4731998145580292},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2939326763153076},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29366397857666016},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.2886241376399994},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1767134964466095},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.16056647896766663},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.10703185200691223}],"concepts":[{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6466042399406433},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5451074242591858},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.5067070126533508},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.47550636529922485},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4731998145580292},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2939326763153076},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29366397857666016},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2886241376399994},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1767134964466095},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.16056647896766663},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.10703185200691223}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:zenodo.org:6523400","is_oa":true,"landing_page_url":"https://zenodo.org/record/6523400","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},{"id":"doi:10.5281/zenodo.6523400","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.6523400","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:6523400","is_oa":true,"landing_page_url":"https://zenodo.org/record/6523400","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2054026175"],"abstract_inverted_index":{"The":[0],"set":[1],"of":[2,88,139,252],"Knowledge":[3],"Graphs":[4],"(KGs)":[5],"generated":[6],"with":[7,111,149],"automatic":[8],"and":[9,19,61,72,157,175,178],"manual":[10],"approaches":[11,39,238],"is":[12,26,169,184],"constantly":[13],"growing.<br>":[14],"For":[15],"an":[16,21],"integrated":[17],"view":[18],"usage,":[20],"alignment":[22],"between":[23,115],"these":[24],"KGs":[25,82],"necessary":[27],"on":[28],"the":[29,86,127,140,173,188,191,203,221,245,250,253,260],"schema":[30],"as":[31,33],"well":[32],"instance":[34],"level.<br>":[35],"There":[36],"are":[37,55,69,85,143,216,257],"already":[38],"which":[40,78,84,215,239],"try":[41],"to":[42,57,131,197,209,219,249],"tackle":[43],"this":[44,95,231],"multi":[45,106,222,235],"source":[46,107,236],"knowledge":[47,108,122],"graph":[48,109],"matching":[49,90,110,155,212,224,237],"problem,<br>":[50],"but":[51],"large":[52,133],"gold":[53,67,102,141],"standards":[54,68],"missing":[56],"evaluate":[58,234],"their":[59],"effectiveness":[60],"scalability.<br>":[62],"In":[63],"particular,":[64],"most":[65],"existing":[66,89],"fairly":[70],"small":[71],"can":[73],"be":[74],"solved":[75],"by":[76,97,125],"matchers":[77,243],"match":[79],"exactly":[80],"two":[81,158],"(1:1),":[83],"majority":[87],"systems.<br>":[91],"<br>":[92,136,194,214],"We":[93,195],"close":[94],"gap":[96],"presenting":[98],"Gollum":[99],"--":[100],"a":[101,132,147,227],"standard":[103,142],"for":[104,152,160,211],"large-scale":[105],"over":[112],"275,000":[113],"correspondences":[114,151],"4,149":[116],"different":[117],"KGs.<br>":[118],"They":[119],"originate":[120],"from":[121,244],"graphs":[123],"derived":[124],"applying":[126],"DBpedia":[128],"extraction":[129],"framework":[130],"wiki":[134],"farm.<br>":[135],"Three":[137],"variations":[138],"made":[144],"available:<br>":[145],"(1)":[146],"version":[148],"all":[150],"evaluating":[153,161],"unsupervised":[154],"approaches,":[156],"versions":[159],"supervised":[162],"matching:":[163],"(2)":[164],"one":[165,180],"where":[166,181],"each":[167,182],"KG":[168,183,200,223,254],"contained":[170,186],"both":[171],"in":[172,187],"train":[174,189],"test":[176,192],"set,":[177],"(3)":[179],"exclusively":[185],"or":[190],"set.":[193],"plan":[196],"extend":[198],"our":[199],"track":[201],"at":[202,259],"Ontology":[204],"Alignment":[205],"Evaluation":[206],"Initiative":[207],"(OAEI)":[208],"allow":[210],"systems":[213],"specifically":[217],"designed":[218],"solve":[220],"problem.<br>":[225],"As":[226],"first":[228],"step":[229],"towards":[230],"direction,":[232],"we":[233],"reuse":[240],"two-KG":[241],"(1:1)":[242],"past":[246],"OAEI.":[247],"Due":[248],"size":[251],"files,":[255],"they":[256],"hosted":[258],"institute:":[261],"http://data.dws.informatik.uni-mannheim.de/dbkwik/gollum/40K.tar":[262],"(50,3":[263],"GB)<br>":[264,267],"http://data.dws.informatik.uni-mannheim.de/dbkwik/gollum/all.tar":[265],"(74,7":[266],"http://data.dws.informatik.uni-mannheim.de/dbkwik/gollum/gold.tar":[268],"(25,3":[269],"GB)":[270]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
