{"id":"https://openalex.org/W2026810221","doi":"https://doi.org/10.1145/2506182.2506198","title":"Improving efficiency and accuracy in multilingual entity extraction","display_name":"Improving efficiency and accuracy in multilingual entity extraction","publication_year":2013,"publication_date":"2013-09-04","ids":{"openalex":"https://openalex.org/W2026810221","doi":"https://doi.org/10.1145/2506182.2506198","mag":"2026810221"},"language":"en","primary_location":{"id":"doi:10.1145/2506182.2506198","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2506182.2506198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Semantic Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/3438995","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076793943","display_name":"Joachim Daiber","orcid":"https://orcid.org/0000-0003-2151-6826"},"institutions":[{"id":"https://openalex.org/I169381384","display_name":"University of Groningen","ror":"https://ror.org/012p63287","country_code":"NL","type":"education","lineage":["https://openalex.org/I169381384"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Joachim Daiber","raw_affiliation_strings":["Computational Linguistics Rijksuniversiteit Groningen, Groningen, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Computational Linguistics Rijksuniversiteit Groningen, Groningen, The Netherlands","institution_ids":["https://openalex.org/I169381384"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009956728","display_name":"Max Jakob","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Max Jakob","raw_affiliation_strings":["Neofonie GmbH, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Neofonie GmbH, Berlin, Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023447446","display_name":"Chris Hokamp","orcid":null},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chris Hokamp","raw_affiliation_strings":["University of North Texas, Denton, TX"],"affiliations":[{"raw_affiliation_string":"University of North Texas, Denton, TX","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012347190","display_name":"Pablo N. Mendes","orcid":"https://orcid.org/0000-0002-0079-7991"},"institutions":[{"id":"https://openalex.org/I19648265","display_name":"Wright State University","ror":"https://ror.org/04qk6pt94","country_code":"US","type":"education","lineage":["https://openalex.org/I19648265"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pablo N. Mendes","raw_affiliation_strings":["Wright State University, Dayton, OH","wright state university, Dayton, OH"],"affiliations":[{"raw_affiliation_string":"Wright State University, Dayton, OH","institution_ids":["https://openalex.org/I19648265"]},{"raw_affiliation_string":"wright state university, Dayton, OH","institution_ids":["https://openalex.org/I19648265"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076793943"],"corresponding_institution_ids":["https://openalex.org/I169381384"],"apc_list":null,"apc_paid":null,"fwci":53.3796,"has_fulltext":false,"cited_by_count":513,"citation_normalized_percentile":{"value":0.99891611,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"121","last_page":"124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9189602136611938},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6490190029144287},{"id":"https://openalex.org/keywords/entity-linking","display_name":"Entity linking","score":0.6353408694267273},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6260446906089783},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.5253150463104248},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5156370401382446},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5003805160522461},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4926791787147522},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.49133697152137756},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.42327994108200073},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.09983742237091064},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.08579570055007935}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9189602136611938},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6490190029144287},{"id":"https://openalex.org/C96711827","wikidata":"https://www.wikidata.org/wiki/Q17012245","display_name":"Entity linking","level":3,"score":0.6353408694267273},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6260446906089783},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.5253150463104248},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5156370401382446},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5003805160522461},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4926791787147522},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.49133697152137756},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.42327994108200073},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.09983742237091064},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.08579570055007935},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2506182.2506198","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2506182.2506198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Semantic Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:zenodo.org:3438995","is_oa":true,"landing_page_url":"https://zenodo.org/record/3438995","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:3438995","is_oa":true,"landing_page_url":"https://zenodo.org/record/3438995","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6499999761581421}],"awards":[{"id":"https://openalex.org/G2991613951","display_name":null,"funder_award_id":"Dicode (GA no. 257184)","funder_id":"https://openalex.org/F4320334960","funder_display_name":"Seventh Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320309327","display_name":"Google","ror":"https://ror.org/00njsd438"},{"id":"https://openalex.org/F4320332555","display_name":"Magyar Tudom\u00e1nyos Akad\u00e9mia Sz\u00e1m\u00edt\u00e1stechnikai \u00e9s Automatiz\u00e1l\u00e1si Kutat\u00f3int\u00e9zet","ror":"https://ror.org/0249v7n71"},{"id":"https://openalex.org/F4320334960","display_name":"Seventh Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W178672779","https://openalex.org/W2100341149","https://openalex.org/W2104583100","https://openalex.org/W2162638401","https://openalex.org/W2250919158"],"related_works":["https://openalex.org/W2186562580","https://openalex.org/W3198729192","https://openalex.org/W4255258373","https://openalex.org/W2593907245","https://openalex.org/W3000685722","https://openalex.org/W2520117834","https://openalex.org/W3133906981","https://openalex.org/W4390279576","https://openalex.org/W3006227201","https://openalex.org/W3160627956"],"abstract_inverted_index":{"There":[0],"has":[1,27],"recently":[2],"been":[3],"an":[4],"increased":[5],"interest":[6],"in":[7,85,120,126],"named":[8],"entity":[9],"recognition":[10,121],"and":[11,31,46,66,83,91,110,122],"disambiguation":[12,123],"systems":[13],"at":[14],"major":[15],"conferences":[16],"such":[17],"as":[18],"WWW,":[19],"SIGIR,":[20],"ACL,":[21],"KDD,":[22],"etc.":[23],"However,":[24],"most":[25],"work":[26],"focused":[28],"on":[29],"algorithms":[30],"evaluations,":[32],"leaving":[33],"little":[34],"space":[35,81],"for":[36,98],"implementation":[37,45],"details.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42,50,95,107],"discuss":[43],"some":[44],"data":[47],"processing":[48],"challenges":[49,109],"encountered":[51],"while":[52],"developing":[53],"a":[54],"new":[55],"multilingual":[56],"version":[57],"of":[58,88,124],"DBpedia":[59],"Spotlight":[60],"that":[61],"is":[62],"faster,":[63],"more":[64],"accurate":[65],"easier":[67],"to":[68,74,112],"configure.":[69],"We":[70],"compare":[71],"our":[72],"solution":[73],"the":[75,86,89,103,114],"previous":[76],"system,":[77],"considering":[78],"time":[79],"performance,":[80],"requirements":[82],"accuracy":[84],"context":[87],"Dutch":[90],"English":[92],"languages.":[93],"Additionally,":[94],"report":[96],"results":[97],"9":[99],"additional":[100],"languages":[101],"among":[102],"largest":[104],"Wikipedias.":[105],"Finally,":[106],"present":[108],"experiences":[111],"foment":[113],"discussion":[115],"with":[116],"other":[117],"developers":[118],"interested":[119],"entities":[125],"natural":[127],"language":[128],"text.":[129]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":36},{"year":2022,"cited_by_count":20},{"year":2021,"cited_by_count":58},{"year":2020,"cited_by_count":63},{"year":2019,"cited_by_count":72},{"year":2018,"cited_by_count":62},{"year":2017,"cited_by_count":65},{"year":2016,"cited_by_count":61},{"year":2015,"cited_by_count":28},{"year":2014,"cited_by_count":21},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
