{"id":"https://openalex.org/W2087483562","doi":"https://doi.org/10.1109/bhi.2014.6864381","title":"Implementation of an extended Fellegi-Sunter probabilistic record linkage method using the Jaro-Winkler string comparator","display_name":"Implementation of an extended Fellegi-Sunter probabilistic record linkage method using the Jaro-Winkler string comparator","publication_year":2014,"publication_date":"2014-06-01","ids":{"openalex":"https://openalex.org/W2087483562","doi":"https://doi.org/10.1109/bhi.2014.6864381","mag":"2087483562"},"language":"en","primary_location":{"id":"doi:10.1109/bhi.2014.6864381","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bhi.2014.6864381","pdf_url":null,"source":{"id":"https://openalex.org/S4393918972","display_name":"IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI ...)","issn_l":"2641-3590","issn":["2641-3590"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100381220","display_name":"Xinran Li","orcid":"https://orcid.org/0000-0002-5678-6829"},"institutions":[{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]},{"id":"https://openalex.org/I10342815","display_name":"International Space University","ror":"https://ror.org/04t6r6d34","country_code":"FR","type":"education","lineage":["https://openalex.org/I10342815"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Xinran Li","raw_affiliation_strings":["ISIT, Auvergne University, France","ISIT, Auvergne Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"ISIT, Auvergne University, France","institution_ids":["https://openalex.org/I10342815"]},{"raw_affiliation_string":"ISIT, Auvergne Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033802430","display_name":"Aline Guttmann","orcid":"https://orcid.org/0000-0003-0162-837X"},"institutions":[{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]},{"id":"https://openalex.org/I10342815","display_name":"International Space University","ror":"https://ror.org/04t6r6d34","country_code":"FR","type":"education","lineage":["https://openalex.org/I10342815"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Aline Guttmann","raw_affiliation_strings":["ISIT, Auvergne University, France","ISIT, Auvergne Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"ISIT, Auvergne University, France","institution_ids":["https://openalex.org/I10342815"]},{"raw_affiliation_string":"ISIT, Auvergne Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015066436","display_name":"S\u00e9bastien Cipi\u00e8re","orcid":null},"institutions":[{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sebastien Cipiere","raw_affiliation_strings":["LPC, Blaise Pascal University, France","LPC, Blaise Pascal Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"LPC, Blaise Pascal University, France","institution_ids":["https://openalex.org/I198244214"]},{"raw_affiliation_string":"LPC, Blaise Pascal Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049906273","display_name":"Lydia Maigne","orcid":"https://orcid.org/0000-0002-0414-8462"},"institutions":[{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Lydia Maigne","raw_affiliation_strings":["LPC, Blaise Pascal University, France","LPC, Blaise Pascal Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"LPC, Blaise Pascal University, France","institution_ids":["https://openalex.org/I198244214"]},{"raw_affiliation_string":"LPC, Blaise Pascal Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040800580","display_name":"Jacques Demongeot","orcid":"https://orcid.org/0000-0002-8335-9240"},"institutions":[{"id":"https://openalex.org/I177483745","display_name":"Universit\u00e9 Joseph Fourier","ror":"https://ror.org/02aj0kh94","country_code":"FR","type":"education","lineage":["https://openalex.org/I177483745"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jacques Demongeot","raw_affiliation_strings":["AGIM, School of Medicine, Grenoble, France","La Tronche Sch. of Med., AGIM, Joseph Fourier Univ., Grenoble, France"],"affiliations":[{"raw_affiliation_string":"AGIM, School of Medicine, Grenoble, France","institution_ids":[]},{"raw_affiliation_string":"La Tronche Sch. of Med., AGIM, Joseph Fourier Univ., Grenoble, France","institution_ids":["https://openalex.org/I177483745"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110019157","display_name":"Jean\u2010Yves Boire","orcid":null},"institutions":[{"id":"https://openalex.org/I10342815","display_name":"International Space University","ror":"https://ror.org/04t6r6d34","country_code":"FR","type":"education","lineage":["https://openalex.org/I10342815"]},{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jean-Yves Boire","raw_affiliation_strings":["ISIT, Auvergne University, France","ISIT, Auvergne Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"ISIT, Auvergne University, France","institution_ids":["https://openalex.org/I10342815"]},{"raw_affiliation_string":"ISIT, Auvergne Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006455729","display_name":"Lemlih Ouchchane","orcid":"https://orcid.org/0000-0003-0717-3150"},"institutions":[{"id":"https://openalex.org/I198244214","display_name":"Universit\u00e9 Clermont Auvergne","ror":"https://ror.org/01a8ajp46","country_code":"FR","type":"education","lineage":["https://openalex.org/I198244214"]},{"id":"https://openalex.org/I10342815","display_name":"International Space University","ror":"https://ror.org/04t6r6d34","country_code":"FR","type":"education","lineage":["https://openalex.org/I10342815"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Lemlih Ouchchane","raw_affiliation_strings":["ISIT, Auvergne University, France","ISIT, Auvergne Univ., Clermont-Ferrand, France"],"affiliations":[{"raw_affiliation_string":"ISIT, Auvergne University, France","institution_ids":["https://openalex.org/I10342815"]},{"raw_affiliation_string":"ISIT, Auvergne Univ., Clermont-Ferrand, France","institution_ids":["https://openalex.org/I198244214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100381220"],"corresponding_institution_ids":["https://openalex.org/I10342815","https://openalex.org/I198244214"],"apc_list":null,"apc_paid":null,"fwci":3.3773,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.92807746,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"60","issue":null,"first_page":"375","last_page":"379"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9733999967575073,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9106000065803528,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/record-linkage","display_name":"Record linkage","score":0.8089733123779297},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6773989796638489},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6528561115264893},{"id":"https://openalex.org/keywords/linkage","display_name":"Linkage (software)","score":0.5640656352043152},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.5290966033935547},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5269694328308105},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.5068596005439758},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4681333005428314},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.44164690375328064},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4348582923412323},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3700402081012726},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3452926278114319},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29455018043518066},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.10181871056556702}],"concepts":[{"id":"https://openalex.org/C142210648","wikidata":"https://www.wikidata.org/wiki/Q1266546","display_name":"Record linkage","level":3,"score":0.8089733123779297},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6773989796638489},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6528561115264893},{"id":"https://openalex.org/C31266012","wikidata":"https://www.wikidata.org/wiki/Q6554340","display_name":"Linkage (software)","level":3,"score":0.5640656352043152},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.5290966033935547},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5269694328308105},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.5068596005439758},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4681333005428314},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.44164690375328064},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4348582923412323},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3700402081012726},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3452926278114319},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29455018043518066},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.10181871056556702},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bhi.2014.6864381","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bhi.2014.6864381","pdf_url":null,"source":{"id":"https://openalex.org/S4393918972","display_name":"IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI ...)","issn_l":"2641-3590","issn":["2641-3590"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5099999904632568,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W41404523","https://openalex.org/W1570596343","https://openalex.org/W1964584862","https://openalex.org/W1985690171","https://openalex.org/W1990028388","https://openalex.org/W2004918398","https://openalex.org/W2024018837","https://openalex.org/W2028251458","https://openalex.org/W2034190452","https://openalex.org/W2049633694","https://openalex.org/W2101508813","https://openalex.org/W2114793173","https://openalex.org/W2128600649","https://openalex.org/W2171033594","https://openalex.org/W2794286494","https://openalex.org/W4230502578","https://openalex.org/W4242744113","https://openalex.org/W6633928172"],"related_works":["https://openalex.org/W2487032012","https://openalex.org/W2211355040","https://openalex.org/W2808916796","https://openalex.org/W1501601012","https://openalex.org/W2176311362","https://openalex.org/W3088855600","https://openalex.org/W3012491082","https://openalex.org/W3211905090","https://openalex.org/W2178148352","https://openalex.org/W1936317645"],"abstract_inverted_index":{"Record":[0,62],"linkage":[1,44,127],"is":[2,45,55,103,115],"the":[3,17,40,79,89,100,107,110,136,144,148,152,162,181],"task":[4],"of":[5,60,78,91,99,112,123,147,161,183],"identifying":[6],"which":[7],"records":[8,21],"from":[9],"one":[10],"or":[11],"more":[12],"data":[13,157],"sources":[14],"refer":[15],"to":[16,134,165,170,179],"same":[18],"person.":[19],"Often,":[20],"do":[22],"not":[23],"have":[24],"a":[25,38,46,53,67],"common":[26],"key":[27],"and":[28,93,129,141,169,173,186],"may":[29],"contain":[30],"typographical":[31],"variations":[32],"in":[33,36,88,106,131],"identifier":[34],"fields,":[35],"such":[37],"case,":[39],"Fellegi-Sunter":[41,80,101,174],"probabilistic":[42],"record":[43,126],"method":[47,81,102,114,150],"commonly":[48],"used.":[49],"In":[50],"this":[51],"method,":[52],"weight":[54],"assigned":[56],"for":[57],"each":[58],"pair":[59],"records.":[61],"pairs":[63],"with":[64],"weights":[65],"above":[66],"given":[68],"threshold":[69],"are":[70],"considered":[71],"as":[72],"matches.":[73],"Winkler":[74,113,137,149,172],"introduced":[75],"an":[76],"extension":[77],"that":[82],"takes":[83],"into":[84],"account":[85],"field":[86],"similarity":[87],"calculation":[90],"weight,":[92],"proved":[94],"its":[95],"outperformance.":[96],"The":[97],"implementation":[98],"frequently":[104],"presented":[105],"literature,":[108],"however,":[109],"application":[111],"rarely":[116],"mentioned.":[117],"This":[118],"paper":[119],"presents":[120],"brief":[121],"backgrounds":[122],"these":[124],"two":[125],"methods,":[128],"describes":[130],"details":[132],"how":[133],"implement":[135],"method.":[138],"We":[139],"formalized":[140],"then":[142],"estimated":[143],"required":[145],"parameters":[146],"using":[151],"expectation-maximization":[153],"(EM)":[154],"algorithm.":[155],"Simulated":[156],"sets-with":[158],"known":[159],"truth":[160],"matches-were":[163],"used":[164],"assess":[166],"parameters'":[167],"estimation":[168],"compare":[171],"methods":[175],"regarding":[176],"their":[177],"ability":[178],"reduce":[180],"rates":[182],"false":[184,187],"matches":[185],"non-matches.":[188]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
