{"id":"https://openalex.org/W1996408240","doi":"https://doi.org/10.1145/2494188.2494193","title":"Extraction of Address Data from Unstructured Text using Free Knowledge Resources","display_name":"Extraction of Address Data from Unstructured Text using Free Knowledge Resources","publication_year":2013,"publication_date":"2013-09-04","ids":{"openalex":"https://openalex.org/W1996408240","doi":"https://doi.org/10.1145/2494188.2494193","mag":"1996408240"},"language":"en","primary_location":{"id":"doi:10.1145/2494188.2494193","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2494188.2494193","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Knowledge Management and Knowledge Technologies","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045720797","display_name":"Sebastian Schmidt","orcid":"https://orcid.org/0000-0001-9028-8914"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Sebastian Schmidt","raw_affiliation_strings":["Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068848089","display_name":"Simon Manschitz","orcid":"https://orcid.org/0000-0001-6419-8157"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Manschitz","raw_affiliation_strings":["Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009893898","display_name":"Christoph Rensing","orcid":"https://orcid.org/0000-0002-1287-216X"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christoph Rensing","raw_affiliation_strings":["Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004933128","display_name":"Ralf Steinmetz","orcid":"https://orcid.org/0000-0002-6839-9359"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Ralf Steinmetz","raw_affiliation_strings":["Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Multimedia Communications Lab, Technische Universit\u00e4t, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5045720797"],"corresponding_institution_ids":["https://openalex.org/I31512782"],"apc_list":null,"apc_paid":null,"fwci":1.6179,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.87654366,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9804999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8391202688217163},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.6454165577888489},{"id":"https://openalex.org/keywords/unstructured-data","display_name":"Unstructured data","score":0.5963066816329956},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.5432880520820618},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5273569226264954},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5239301323890686},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.5192332863807678},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.49249252676963806},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.46730944514274597},{"id":"https://openalex.org/keywords/web-intelligence","display_name":"Web intelligence","score":0.4529380798339844},{"id":"https://openalex.org/keywords/web-modeling","display_name":"Web modeling","score":0.43275201320648193},{"id":"https://openalex.org/keywords/data-web","display_name":"Data Web","score":0.42980632185935974},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3538244962692261},{"id":"https://openalex.org/keywords/web-service","display_name":"Web service","score":0.2874850630760193},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.24910244345664978},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.09847334027290344}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8391202688217163},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.6454165577888489},{"id":"https://openalex.org/C2781252014","wikidata":"https://www.wikidata.org/wiki/Q1141900","display_name":"Unstructured data","level":3,"score":0.5963066816329956},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.5432880520820618},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5273569226264954},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5239301323890686},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.5192332863807678},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.49249252676963806},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.46730944514274597},{"id":"https://openalex.org/C544335954","wikidata":"https://www.wikidata.org/wiki/Q2553348","display_name":"Web intelligence","level":4,"score":0.4529380798339844},{"id":"https://openalex.org/C130436687","wikidata":"https://www.wikidata.org/wiki/Q7978591","display_name":"Web modeling","level":3,"score":0.43275201320648193},{"id":"https://openalex.org/C162005631","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Data Web","level":3,"score":0.42980632185935974},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3538244962692261},{"id":"https://openalex.org/C35578498","wikidata":"https://www.wikidata.org/wiki/Q193424","display_name":"Web service","level":2,"score":0.2874850630760193},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.24910244345664978},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.09847334027290344},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2494188.2494193","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2494188.2494193","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Knowledge Management and Knowledge Technologies","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W147081156","https://openalex.org/W1540364107","https://openalex.org/W1551262214","https://openalex.org/W1610212413","https://openalex.org/W2013781937","https://openalex.org/W2022164280","https://openalex.org/W2069818983","https://openalex.org/W2262562434","https://openalex.org/W4239696231","https://openalex.org/W4285719527","https://openalex.org/W7034308714"],"related_works":["https://openalex.org/W2187012497","https://openalex.org/W2945931694","https://openalex.org/W2184263241","https://openalex.org/W2134078223","https://openalex.org/W2415191659","https://openalex.org/W2542140006","https://openalex.org/W2182629206","https://openalex.org/W2288367326","https://openalex.org/W2744329849","https://openalex.org/W4385950365"],"abstract_inverted_index":{"The":[0,119],"Web":[1,6,13,31,66,111],"is":[2,42],"populated":[3],"with":[4],"many":[5],"sites":[7,14,67,112],"containing":[8],"unstructured":[9],"textual":[10],"information.":[11],"These":[12],"are":[15,26,51],"a":[16,88,107,114],"source":[17],"of":[18,36,60,109,126],"knowledge":[19,38,99],"for":[20,48,73,124],"various":[21,77,133],"interests.":[22],"As":[23],"semantic":[24],"annotations":[25],"only":[27],"rarely":[28],"used":[29],"on":[30,65,106],"sites,":[32],"an":[33],"automated":[34],"harvesting":[35],"the":[37,58,71,129],"without":[39],"additional":[40],"effort":[41],"not":[43],"possible.":[44],"Thus,":[45],"elaborated":[46],"approaches":[47],"information":[49],"extraction":[50],"required.":[52],"In":[53,79],"our":[54,83],"work":[55],"we":[56,69,85],"face":[57],"challenge":[59],"identifying":[61],"business":[62],"address":[63],"data":[64,75],"since":[68],"see":[70],"need":[72],"this":[74],"in":[76,132],"applications.":[78],"order":[80],"to":[81],"accomplish":[82],"aim,":[84],"have":[86],"developed":[87],"hybrid":[89],"approach":[90,120],"combining":[91],"patterns":[92],"and":[93,117],"gazetteers":[94],"obtained":[95],"from":[96],"freely":[97],"available":[98],"resources":[100],"such":[101],"as":[102],"OpenStreetMap.":[103],"Experimental":[104],"evaluation":[105],"corpus":[108],"heterogeneous":[110],"shows":[113],"high":[115],"recall":[116],"precision.":[118],"can":[121],"be":[122],"adapted":[123],"identification":[125],"addresses":[127],"considering":[128],"different":[130],"formats":[131],"countries.":[134]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
