{"id":"https://openalex.org/W1984464248","doi":"https://doi.org/10.1109/icdew.2014.6818303","title":"Bootstrapping Wikipedia to answer ambiguous person name queries","display_name":"Bootstrapping Wikipedia to answer ambiguous person name queries","publication_year":2014,"publication_date":"2014-03-01","ids":{"openalex":"https://openalex.org/W1984464248","doi":"https://doi.org/10.1109/icdew.2014.6818303","mag":"1984464248"},"language":"en","primary_location":{"id":"doi:10.1109/icdew.2014.6818303","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdew.2014.6818303","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 30th International Conference on Data Engineering Workshops","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068894225","display_name":"Toni Gruetze","orcid":null},"institutions":[{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Toni Gruetze","raw_affiliation_strings":["Hasso Plattner Institute, Potsdam, Germany","Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Hasso Plattner Institute, Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]},{"raw_affiliation_string":"Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024434748","display_name":"Gjergji Kasneci","orcid":null},"institutions":[{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gjergji Kasneci","raw_affiliation_strings":["Hasso Plattner Institute, Potsdam, Germany","Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Hasso Plattner Institute, Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]},{"raw_affiliation_string":"Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003857202","display_name":"Zhe Zuo","orcid":null},"institutions":[{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Zhe Zuo","raw_affiliation_strings":["Hasso Plattner Institute, Potsdam, Germany","Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Hasso Plattner Institute, Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]},{"raw_affiliation_string":"Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053028480","display_name":"Felix Naumann","orcid":"https://orcid.org/0000-0002-4483-1389"},"institutions":[{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Felix Naumann","raw_affiliation_strings":["Hasso Plattner Institute, Potsdam, Germany","Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Hasso Plattner Institute, Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]},{"raw_affiliation_string":"Hasso Plattner Institute, Prof.-Dr.-Helmert-Stra\u00dfe 2-3, 14482 Potsdam, Germany","institution_ids":["https://openalex.org/I143288331"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5068894225"],"corresponding_institution_ids":["https://openalex.org/I143288331"],"apc_list":null,"apc_paid":null,"fwci":1.44894316,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.84709659,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"56","last_page":"61"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8157196044921875},{"id":"https://openalex.org/keywords/pagerank","display_name":"PageRank","score":0.7747184038162231},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7234809994697571},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6942538619041443},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.6149356365203857},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6087848544120789},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5909807085990906},{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.5761626362800598},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.46594178676605225},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.45411092042922974},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4441661238670349},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.42088013887405396},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2069035768508911},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09569776058197021}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8157196044921875},{"id":"https://openalex.org/C2779172887","wikidata":"https://www.wikidata.org/wiki/Q184316","display_name":"PageRank","level":2,"score":0.7747184038162231},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7234809994697571},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6942538619041443},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.6149356365203857},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6087848544120789},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5909807085990906},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.5761626362800598},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.46594178676605225},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.45411092042922974},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4441661238670349},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.42088013887405396},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2069035768508911},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09569776058197021},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdew.2014.6818303","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdew.2014.6818303","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE 30th International Conference on Data Engineering Workshops","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W86887328","https://openalex.org/W1482174963","https://openalex.org/W1605544227","https://openalex.org/W1854214752","https://openalex.org/W1945100810","https://openalex.org/W1971318281","https://openalex.org/W1981590391","https://openalex.org/W1982678692","https://openalex.org/W1995099886","https://openalex.org/W2033073041","https://openalex.org/W2048978851","https://openalex.org/W2060314721","https://openalex.org/W2100958137","https://openalex.org/W2113227740","https://openalex.org/W2113586662","https://openalex.org/W2121080163","https://openalex.org/W2123492197","https://openalex.org/W2130395434","https://openalex.org/W2338237122","https://openalex.org/W2754038687","https://openalex.org/W4302802341","https://openalex.org/W6603544577","https://openalex.org/W6628614335","https://openalex.org/W6678401714","https://openalex.org/W6679397115","https://openalex.org/W6703593779","https://openalex.org/W6744621523"],"related_works":["https://openalex.org/W2368605798","https://openalex.org/W2518037665","https://openalex.org/W2348524959","https://openalex.org/W2477036161","https://openalex.org/W2368049389","https://openalex.org/W2384861574","https://openalex.org/W4294565801","https://openalex.org/W2170801710","https://openalex.org/W1989785885","https://openalex.org/W2358249271"],"abstract_inverted_index":{"Some":[0],"of":[1,6,37,43,115,141,146,211],"the":[2,41,57,78,84,93,107,116,120,137,164,184,193,197],"main":[3],"ranking":[4,17],"features":[5,29],"today's":[7],"search":[8,44,125],"engines":[9],"reflect":[10],"result":[11],"popularity":[12],"and":[13,25,68,172],"are":[14,72,139],"based":[15],"on":[16,166,207,220],"models,":[18],"such":[19,28,156],"as":[20,157],"PageRank,":[21],"implicit":[22],"feedback":[23],"aggregation,":[24],"more.":[26],"While":[27],"yield":[30],"satisfactory":[31,53],"results":[32,54,90,126,194],"for":[33,45,49],"a":[34,50,64,131,208],"wide":[35],"range":[36],"queries,":[38],"they":[39],"aggravate":[40],"problem":[42,103],"ambiguous":[46,181,222],"entities:":[47],"Searching":[48],"person":[51,58,94,182,223],"yields":[52],"only":[55],"if":[56],"in":[59,74,95,119,152,200],"question":[60],"is":[61,104,169],"represented":[62],"by":[63,134],"high-ranked":[65],"Web":[66,153,214],"page":[67],"all":[69],"required":[70],"information":[71,148,165,185],"contained":[73],"this":[75,102],"page.":[76],"Otherwise,":[77],"user":[79],"has":[80,127],"to":[81,91,100,105,129,191,196],"either":[82],"reformulate/refine":[83],"query":[85],"or":[86],"manually":[87],"inspect":[88],"low-ranked":[89],"find":[92],"question.":[96],"A":[97,144],"possible":[98],"approach":[99],"solve":[101],"cluster":[106,112],"results,":[108],"so":[109],"that":[110,177],"each":[111],"represents":[113],"one":[114],"persons":[117,150],"occurring":[118,199],"answer":[121],"set.":[122],"However":[123],"clustering":[124],"proven":[128],"be":[130,189],"difficult":[132],"endeavor":[133],"itself,":[135],"where":[136],"clusters":[138],"typically":[140],"moderate":[142],"quality.":[143],"wealth":[145],"useful":[147],"about":[149],"occurs":[151],"2.0":[154],"platforms,":[155],"Wikipedia,":[158],"LinkedIn,":[159],"Facebook,":[160],"etc.":[161],"Being":[162],"human-generated,":[163],"these":[167],"platforms":[168],"clean,":[170],"focused,":[171],"already":[173],"disambiguated.":[174],"We":[175,202],"show":[176],"when":[178],"searching":[179],"with":[180],"names":[183],"from":[186,217],"Wikipedia":[187],"can":[188],"bootstrapped":[190],"group":[192],"according":[195],"individuals":[198],"them.":[201],"have":[203],"evaluated":[204],"our":[205],"methods":[206],"hand-labeled":[209],"dataset":[210],"around":[212],"5,000":[213],"pages":[215],"retrieved":[216],"Google":[218],"queries":[219],"50":[221],"names.":[224]},"counts_by_year":[{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
