{"id":"https://openalex.org/W3085516325","doi":"https://doi.org/10.1145/3397536.3422236","title":"A Deep Learning Approach to Geographical Candidate Selection through Toponym Matching","display_name":"A Deep Learning Approach to Geographical Candidate Selection through Toponym Matching","publication_year":2020,"publication_date":"2020-11-03","ids":{"openalex":"https://openalex.org/W3085516325","doi":"https://doi.org/10.1145/3397536.3422236","mag":"3085516325"},"language":"en","primary_location":{"id":"doi:10.1145/3397536.3422236","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3397536.3422236","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Advances in Geographic Information Systems","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2009.08114","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051763204","display_name":"Mariona Coll Ardanuy","orcid":"https://orcid.org/0000-0001-8455-7196"},"institutions":[{"id":"https://openalex.org/I4210128584","display_name":"The Alan Turing Institute","ror":"https://ror.org/035dkdb55","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210128584"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mariona Coll Ardanuy","raw_affiliation_strings":["The Alan Turing Institute, London, United Kingdom","The Alan Turing Institute, London (United Kingdom)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Alan Turing Institute, London, United Kingdom","institution_ids":["https://openalex.org/I4210128584"]},{"raw_affiliation_string":"The Alan Turing Institute, London (United Kingdom)","institution_ids":["https://openalex.org/I4210128584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057896998","display_name":"Kasra Hosseini","orcid":"https://orcid.org/0000-0003-4396-6019"},"institutions":[{"id":"https://openalex.org/I4210128584","display_name":"The Alan Turing Institute","ror":"https://ror.org/035dkdb55","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210128584"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kasra Hosseini","raw_affiliation_strings":["The Alan Turing Institute, London, United Kingdom","The Alan Turing Institute, London (United Kingdom)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Alan Turing Institute, London, United Kingdom","institution_ids":["https://openalex.org/I4210128584"]},{"raw_affiliation_string":"The Alan Turing Institute, London (United Kingdom)","institution_ids":["https://openalex.org/I4210128584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023931434","display_name":"Katherine McDonough","orcid":"https://orcid.org/0000-0001-7506-1025"},"institutions":[{"id":"https://openalex.org/I4210128584","display_name":"The Alan Turing Institute","ror":"https://ror.org/035dkdb55","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210128584"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Katherine McDonough","raw_affiliation_strings":["The Alan Turing Institute, London, United Kingdom","The Alan Turing Institute, London (United Kingdom)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Alan Turing Institute, London, United Kingdom","institution_ids":["https://openalex.org/I4210128584"]},{"raw_affiliation_string":"The Alan Turing Institute, London (United Kingdom)","institution_ids":["https://openalex.org/I4210128584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071121843","display_name":"Amrey Krause","orcid":"https://orcid.org/0000-0002-6173-6738"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amrey Krause","raw_affiliation_strings":["Edinburgh Parallel Computing Centre, Edinburgh, United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Edinburgh Parallel Computing Centre, Edinburgh, United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038148264","display_name":"Daniel van Strien","orcid":"https://orcid.org/0000-0003-1684-6556"},"institutions":[{"id":"https://openalex.org/I2800016483","display_name":"British Library","ror":"https://ror.org/05dhe8b71","country_code":"GB","type":"archive","lineage":["https://openalex.org/I2800016483"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Daniel van Strien","raw_affiliation_strings":["The British Library London, United Kingdom","The British Library, London, United Kingdom#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The British Library London, United Kingdom","institution_ids":["https://openalex.org/I2800016483"]},{"raw_affiliation_string":"The British Library, London, United Kingdom#TAB#","institution_ids":["https://openalex.org/I2800016483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064977687","display_name":"Federico Nanni","orcid":"https://orcid.org/0000-0003-2484-4331"},"institutions":[{"id":"https://openalex.org/I4210128584","display_name":"The Alan Turing Institute","ror":"https://ror.org/035dkdb55","country_code":"GB","type":"facility","lineage":["https://openalex.org/I4210128584"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Federico Nanni","raw_affiliation_strings":["The Alan Turing Institute, London, United Kingdom","The Alan Turing Institute, London (United Kingdom)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Alan Turing Institute, London, United Kingdom","institution_ids":["https://openalex.org/I4210128584"]},{"raw_affiliation_string":"The Alan Turing Institute, London (United Kingdom)","institution_ids":["https://openalex.org/I4210128584"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1354,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.56134031,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"385","last_page":"388"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.9847999811172485,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.863627552986145},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.7237486243247986},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.64764803647995},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.624167799949646},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5984047651290894},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5308619141578674},{"id":"https://openalex.org/keywords/toponymy","display_name":"Toponymy","score":0.4815090596675873},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43635815382003784},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41497015953063965},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.413802832365036},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.10568469762802124}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.863627552986145},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.7237486243247986},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.64764803647995},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.624167799949646},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5984047651290894},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5308619141578674},{"id":"https://openalex.org/C116856471","wikidata":"https://www.wikidata.org/wiki/Q485762","display_name":"Toponymy","level":2,"score":0.4815090596675873},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43635815382003784},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41497015953063965},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.413802832365036},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.10568469762802124},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1145/3397536.3422236","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3397536.3422236","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Advances in Geographic Information Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2009.08114","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2009.08114","pdf_url":"https://arxiv.org/pdf/2009.08114","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3085516325","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2009.08114","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:pure.ed.ac.uk:openaire/aecb2f1c-90d6-42c8-b712-f667d8fb5ce3","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/aecb2f1c-90d6-42c8-b712-f667d8fb5ce3","pdf_url":null,"source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Ardanuy, M C, Hosseini, K, McDonough, K, Krause, A, Van Strien, D & Nanni, F 2020, A Deep Learning Approach to Geographical Candidate Selection through Toponym Matching. in C-T Lu, F Wang, G Trajcevski, Y Huang, S Newsam & L Xiong (eds), Proceedings of the 28th International Conference on Advances in Geographic Information Systems, SIGSPATIAL GIS 2020. GIS: Proceedings of the ACM International Symposium on Advances in Geographic Information Systems, pp. 385-388, 28th ACM SIGSPATIAL International Conference on Advances in Geographic Information Systems, SIGSPATIAL GIS 2020, Virtual, Online, United States, 3/11/20. https://doi.org/10.1145/3397536.3422236","raw_type":"contributionToPeriodical"},{"id":"doi:10.48550/arxiv.2009.08114","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2009.08114","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2009.08114","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2009.08114","pdf_url":"https://arxiv.org/pdf/2009.08114","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6200000047683716,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1633672591","display_name":null,"funder_award_id":"N510129","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3713837730","display_name":"Living with Machines","funder_award_id":"AH/S01179X/1","funder_id":"https://openalex.org/F4320334609","funder_display_name":"Arts and Humanities Research Council"},{"id":"https://openalex.org/G7651018554","display_name":null,"funder_award_id":"AH/S01179X/1","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"},{"id":"https://openalex.org/G8583665056","display_name":null,"funder_award_id":"EP/ N510129/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8597009950","display_name":null,"funder_award_id":"EP/N510129/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320334609","display_name":"Arts and Humanities Research Council","ror":"https://ror.org/0505m1554"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3085516325.pdf","grobid_xml":"https://content.openalex.org/works/W3085516325.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W86887328","https://openalex.org/W1548663377","https://openalex.org/W1554612027","https://openalex.org/W1967688128","https://openalex.org/W1990871427","https://openalex.org/W2018277822","https://openalex.org/W2087323714","https://openalex.org/W2088091054","https://openalex.org/W2104583100","https://openalex.org/W2123142779","https://openalex.org/W2127289991","https://openalex.org/W2134118576","https://openalex.org/W2135451108","https://openalex.org/W2137435333","https://openalex.org/W2226371358","https://openalex.org/W2250554077","https://openalex.org/W2251896305","https://openalex.org/W2515960978","https://openalex.org/W2593929528","https://openalex.org/W2612773933","https://openalex.org/W2615263010","https://openalex.org/W2765285316","https://openalex.org/W2896425349","https://openalex.org/W2945214661","https://openalex.org/W2950333738","https://openalex.org/W2950844738","https://openalex.org/W2952490462","https://openalex.org/W2964075320","https://openalex.org/W2990579790","https://openalex.org/W2998702515","https://openalex.org/W3012289950","https://openalex.org/W3105241684","https://openalex.org/W3109019412","https://openalex.org/W4247397059","https://openalex.org/W4292083459"],"related_works":["https://openalex.org/W3109019412","https://openalex.org/W2808008092","https://openalex.org/W2788931857","https://openalex.org/W3039491967","https://openalex.org/W2940674603","https://openalex.org/W2003869148","https://openalex.org/W2984895664","https://openalex.org/W2921058576","https://openalex.org/W3115612113","https://openalex.org/W3177210555","https://openalex.org/W3101680040","https://openalex.org/W2033673704","https://openalex.org/W1561860492","https://openalex.org/W3093143956","https://openalex.org/W2516823085","https://openalex.org/W2897566602","https://openalex.org/W1654545971","https://openalex.org/W3043728279","https://openalex.org/W3163177512","https://openalex.org/W3162486530"],"abstract_inverted_index":{"Recognizing":[0],"toponyms":[1],"and":[2,114,122,135],"resolving":[3],"them":[4],"to":[5,11,16,46],"their":[6],"real-world":[7],"referents":[8],"is":[9,21,34],"required":[10],"provide":[12],"advanced":[13],"semantic":[14],"access":[15],"textual":[17],"data.":[18],"This":[19],"process":[20],"often":[22],"hindered":[23],"by":[24,47],"the":[25,35,39,127],"high":[26],"degree":[27],"of":[28,37,129],"variation":[29],"in":[30,72,126,133],"toponyms.":[31],"Candidate":[32],"selection":[33,60,88,132],"task":[36],"identifying":[38],"potential":[40],"entities":[41],"that":[42],"can":[43],"be":[44],"referred":[45],"a":[48,62,82],"previously":[49],"recognized":[50],"toponym.":[51],"While":[52],"it":[53],"has":[54,61],"traditionally":[55],"received":[56],"little":[57],"attention,":[58],"candidate":[59,87,131],"significant":[63],"impact":[64],"on":[65,105],"downstream":[66],"tasks":[67],"(i.e.":[68],"entity":[69],"resolution),":[70],"especially":[71],"noisy":[73],"or":[74],"non-standard":[75],"text.":[76],"In":[77],"this":[78],"paper,":[79],"we":[80],"introduce":[81],"deep":[83],"learning":[84],"method":[85],"for":[86],"through":[89],"toponym":[90,101],"matching,":[91],"using":[92],"state-of-the-art":[93],"neural":[94],"network":[95],"architectures.":[96],"We":[97],"perform":[98],"an":[99],"intrinsic":[100],"matching":[102],"evaluation":[103],"based":[104],"several":[106],"datasets,":[107],"which":[108],"cover":[109],"various":[110],"challenging":[111],"scenarios":[112],"(cross-lingual":[113],"regional":[115],"variations,":[116],"as":[117,119],"well":[118],"OCR":[120],"errors)":[121],"assess":[123],"its":[124],"performance":[125],"context":[128],"geographical":[130],"English":[134],"Spanish.":[136]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2022-07-25T00:00:00"}
