{"id":"https://openalex.org/W2559636315","doi":"https://doi.org/10.1109/cec.2016.7743805","title":"An automatic framework for entity matching in bibliographic databases","display_name":"An automatic framework for entity matching in bibliographic databases","publication_year":2016,"publication_date":"2016-07-01","ids":{"openalex":"https://openalex.org/W2559636315","doi":"https://doi.org/10.1109/cec.2016.7743805","mag":"2559636315"},"language":"en","primary_location":{"id":"doi:10.1109/cec.2016.7743805","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cec.2016.7743805","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021971352","display_name":"Sumit Mishra","orcid":"https://orcid.org/0000-0001-9333-2001"},"institutions":[{"id":"https://openalex.org/I132153292","display_name":"Indian Institute of Technology Patna","ror":"https://ror.org/01ft5vz71","country_code":"IN","type":"education","lineage":["https://openalex.org/I132153292"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Sumit Mishra","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India","institution_ids":["https://openalex.org/I132153292"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060797340","display_name":"Sriparna Saha","orcid":"https://orcid.org/0000-0001-5458-9381"},"institutions":[{"id":"https://openalex.org/I132153292","display_name":"Indian Institute of Technology Patna","ror":"https://ror.org/01ft5vz71","country_code":"IN","type":"education","lineage":["https://openalex.org/I132153292"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sriparna Saha","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India","institution_ids":["https://openalex.org/I132153292"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088675403","display_name":"Samrat Mondal","orcid":"https://orcid.org/0000-0002-2159-3410"},"institutions":[{"id":"https://openalex.org/I132153292","display_name":"Indian Institute of Technology Patna","ror":"https://ror.org/01ft5vz71","country_code":"IN","type":"education","lineage":["https://openalex.org/I132153292"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Samrat Mondal","raw_affiliation_strings":["Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Indian Institute of Technology Patna, Patna, India","institution_ids":["https://openalex.org/I132153292"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5021971352"],"corresponding_institution_ids":["https://openalex.org/I132153292"],"apc_list":null,"apc_paid":null,"fwci":1.0772,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.82626337,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"271","last_page":"278"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8169790506362915},{"id":"https://openalex.org/keywords/medoid","display_name":"Medoid","score":0.7212307453155518},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6589044332504272},{"id":"https://openalex.org/keywords/sorting","display_name":"Sorting","score":0.6437775492668152},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6309818625450134},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.623503565788269},{"id":"https://openalex.org/keywords/silhouette","display_name":"Silhouette","score":0.6154506206512451},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6014282703399658},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5613794326782227},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.49619704484939575},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.43590784072875977},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.299836665391922},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24105292558670044},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1052946150302887},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09477713704109192}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8169790506362915},{"id":"https://openalex.org/C63085389","wikidata":"https://www.wikidata.org/wiki/Q4287912","display_name":"Medoid","level":3,"score":0.7212307453155518},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6589044332504272},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.6437775492668152},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6309818625450134},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.623503565788269},{"id":"https://openalex.org/C58103923","wikidata":"https://www.wikidata.org/wiki/Q2286025","display_name":"Silhouette","level":2,"score":0.6154506206512451},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6014282703399658},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5613794326782227},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.49619704484939575},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.43590784072875977},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.299836665391922},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24105292558670044},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1052946150302887},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09477713704109192},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cec.2016.7743805","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cec.2016.7743805","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W24227368","https://openalex.org/W106880317","https://openalex.org/W149565845","https://openalex.org/W175950377","https://openalex.org/W1482827835","https://openalex.org/W1497256448","https://openalex.org/W1570834090","https://openalex.org/W1595498733","https://openalex.org/W1659842140","https://openalex.org/W1964786778","https://openalex.org/W1977340740","https://openalex.org/W1987971958","https://openalex.org/W1990421110","https://openalex.org/W1996747841","https://openalex.org/W2014964486","https://openalex.org/W2017555797","https://openalex.org/W2021297832","https://openalex.org/W2022322548","https://openalex.org/W2024770506","https://openalex.org/W2064886355","https://openalex.org/W2069756715","https://openalex.org/W2079567859","https://openalex.org/W2082696804","https://openalex.org/W2085045832","https://openalex.org/W2104051689","https://openalex.org/W2106521941","https://openalex.org/W2114764731","https://openalex.org/W2116661285","https://openalex.org/W2126105956","https://openalex.org/W2136517229","https://openalex.org/W2144358319","https://openalex.org/W2145893390","https://openalex.org/W2147347208","https://openalex.org/W2147437954","https://openalex.org/W2170589503","https://openalex.org/W2184875015","https://openalex.org/W2610904283","https://openalex.org/W4254788633","https://openalex.org/W6628772041","https://openalex.org/W6686826043"],"related_works":["https://openalex.org/W4297433771","https://openalex.org/W3047139727","https://openalex.org/W2357241418","https://openalex.org/W2991436424","https://openalex.org/W2792963552","https://openalex.org/W2086064646","https://openalex.org/W3201783519","https://openalex.org/W3203785702","https://openalex.org/W4286909549","https://openalex.org/W4285791430"],"abstract_inverted_index":{"Entity":[0],"matching":[1,80],"is":[2,12,144,175,226],"to":[3,7,183],"map":[4],"the":[5,8,22,29,36,78,94,140,159,165,170,185,199,223],"records":[6,107],"corresponding":[9],"entity.":[10],"It":[11],"a":[13],"well":[14,216],"known":[15,217],"problem":[16,91],"studied":[17],"by":[18],"many":[19],"researchers":[20],"over":[21,32],"last":[23],"few":[24],"years.":[25],"In":[26,84],"bibliographic":[27,49,203],"database,":[28],"data":[30,123,136,204],"evolve":[31],"time.":[33,53,72],"For":[34],"example,":[35],"email":[37],"id":[38],"of":[39,63,75,208],"an":[40,154],"author":[41],"in":[42],"DBLP":[43,219],"and":[44,92,220],"ArnetMiner":[45],"which":[46,157],"are":[47,181,195,211],"two":[48,214],"databases":[50],"changes":[51,70],"with":[52,65,71,164,192,213],"Authors":[54],"also":[55,69,145],"keep":[56],"on":[57],"changing":[58],"their":[59],"affiliations.":[60],"The":[61,103,206],"set":[62,124],"authors":[64],"whom":[66],"they":[67],"work":[68],"These":[73],"types":[74],"variations":[76],"make":[77],"entity":[79],"task":[81],"more":[82],"difficult.":[83,146],"this":[85,90,149,151],"paper,":[86],"we":[87],"have":[88],"addressed":[89],"proposed":[93,230],"nondominated":[95],"sorting":[96],"genetic":[97],"algorithm-II":[98],"(NSGA-II)":[99],"based":[100,173],"solution":[101],"framework.":[102],"dissimilarities":[104],"between":[105],"different":[106],"can":[108,118,130],"be":[109,119,131],"measured":[110],"using":[111],"various":[112],"distance":[113,116,128,142,161],"measures.":[114],"One":[115],"measure":[117,129,143,162],"suitable":[120,132,160],"for":[121,133,201],"one":[122],"while":[125],"some":[126,134],"other":[127,135],"sets.":[137,205],"So":[138],"selecting":[139],"appropriate":[141,166],"To":[147,168],"address":[148],"issue,":[150],"paper":[152],"presents":[153],"automatic":[155],"framework":[156],"selects":[158],"along":[163,191],"partitioning.":[167],"encode":[169],"partitions,":[171],"medoid":[172],"encoding":[174],"used.":[176],"Several":[177],"new":[178],"mutation":[179],"operations":[180],"used":[182],"explore":[184],"search":[186],"space":[187],"efficiently.":[188],"Silhouette":[189],"Index":[190,194],"Xie-Beni":[193],"optimized":[196],"simultaneously":[197],"during":[198],"experiments":[200],"three":[202],"results":[207,224],"our":[209,229],"approach":[210,231],"compared":[212],"existing":[215],"techniques,":[218],"ArnetMiner.":[221],"From":[222],"it":[225],"clear":[227],"that":[228],"performs":[232],"well.":[233]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
