{"id":"https://openalex.org/W2005508116","doi":"https://doi.org/10.1145/2339530.2339753","title":"LIEGE:","display_name":"LIEGE:","publication_year":2012,"publication_date":"2012-08-12","ids":{"openalex":"https://openalex.org/W2005508116","doi":"https://doi.org/10.1145/2339530.2339753","mag":"2005508116"},"language":"en","primary_location":{"id":"doi:10.1145/2339530.2339753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2339530.2339753","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101956272","display_name":"Wei Shen","orcid":"https://orcid.org/0000-0003-3479-1165"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wei Shen","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100630868","display_name":"Jianyong Wang","orcid":"https://orcid.org/0000-0002-7555-170X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianyong Wang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100752685","display_name":"Ping Luo","orcid":"https://orcid.org/0000-0002-6645-4721"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ping Luo","raw_affiliation_strings":["HP Labs China, Beijing, China","HP Labs China Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"HP Labs China, Beijing, China","institution_ids":[]},{"raw_affiliation_string":"HP Labs China Beijing, China#TAB#","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100340891","display_name":"Min Wang","orcid":"https://orcid.org/0000-0002-1580-6387"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Min Wang","raw_affiliation_strings":["HP Labs China, Beijing, China","HP Labs China Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"HP Labs China, Beijing, China","institution_ids":[]},{"raw_affiliation_string":"HP Labs China Beijing, China#TAB#","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101956272"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":9.2371,"has_fulltext":false,"cited_by_count":54,"citation_normalized_percentile":{"value":0.97472497,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1424","last_page":"1432"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8630056381225586},{"id":"https://openalex.org/keywords/entity-linking","display_name":"Entity linking","score":0.6996012926101685},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6238433718681335},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.552517294883728},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.515238344669342},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.47698384523391724},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4439815580844879},{"id":"https://openalex.org/keywords/social-semantic-web","display_name":"Social Semantic Web","score":0.4307634234428406},{"id":"https://openalex.org/keywords/data-web","display_name":"Data Web","score":0.4149402976036072},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.3652611970901489},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16977643966674805}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8630056381225586},{"id":"https://openalex.org/C96711827","wikidata":"https://www.wikidata.org/wiki/Q17012245","display_name":"Entity linking","level":3,"score":0.6996012926101685},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6238433718681335},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.552517294883728},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.515238344669342},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.47698384523391724},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4439815580844879},{"id":"https://openalex.org/C534406577","wikidata":"https://www.wikidata.org/wiki/Q7550843","display_name":"Social Semantic Web","level":3,"score":0.4307634234428406},{"id":"https://openalex.org/C162005631","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Data Web","level":3,"score":0.4149402976036072},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.3652611970901489},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16977643966674805}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2339530.2339753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2339530.2339753","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W86887328","https://openalex.org/W102708294","https://openalex.org/W1541691357","https://openalex.org/W1548663377","https://openalex.org/W1647729745","https://openalex.org/W1993715838","https://openalex.org/W2011039300","https://openalex.org/W2022166150","https://openalex.org/W2038721957","https://openalex.org/W2092364718","https://openalex.org/W2108223890","https://openalex.org/W2111869785","https://openalex.org/W2114544510","https://openalex.org/W2115352105","https://openalex.org/W2115461474","https://openalex.org/W2124067180","https://openalex.org/W2135767707","https://openalex.org/W2140428995","https://openalex.org/W2145007893","https://openalex.org/W2146304342","https://openalex.org/W2148738951","https://openalex.org/W2150721933","https://openalex.org/W2162638401","https://openalex.org/W2882319491","https://openalex.org/W4235505822","https://openalex.org/W6636975626"],"related_works":["https://openalex.org/W2069569467","https://openalex.org/W2349698472","https://openalex.org/W2183626957","https://openalex.org/W2279098064","https://openalex.org/W2378922560","https://openalex.org/W2363068772","https://openalex.org/W1975429881","https://openalex.org/W2113445341","https://openalex.org/W2551975015","https://openalex.org/W2059445287"],"abstract_inverted_index":{"A":[0],"critical":[1],"step":[2],"in":[3,25,35,110,129,148,155,184,194,271],"bridging":[4],"the":[5,9,20,26,30,36,63,79,93,102,108,114,118,141,152,167,176,180,185,199,215,221,224,228,235,250,259,268],"knowledge":[6,37,54,115],"base":[7,55,116],"with":[8,29,113,159],"huge":[10],"corpus":[11],"of":[12,88,120,137,170,182,201,223,237,273],"semi-structured":[13],"Web":[14,27,71,94,131,157,186,196,229,246,251],"list":[15,42,64,72,87,132,153,158,197,203,230],"data":[16,256],"is":[17,67,85,125],"to":[18,106,117,218],"link":[19],"entity":[21,57,89,172,192],"mentions":[22,90],"that":[23,126,139,145,161,263],"appear":[24],"lists":[28,112,247],"corresponding":[31],"real":[32,245],"world":[33],"entities":[34,109,127,138,160,183,226],"base,":[38],"which":[39],"we":[40,99,165,208],"call":[41],"linking":[43,65,204],"task.":[44],"This":[45],"task":[46,66,84],"can":[47,133],"facilitate":[48],"many":[49],"different":[50,191],"tasks":[51],"such":[52],"as":[53],"population,":[56],"search":[58],"and":[59,78,175,253,258],"table":[60],"annotation.":[61],"However,":[62],"challenging":[68],"because":[69],"a":[70,86,130,156,195,210],"has":[73],"almost":[74],"no":[75],"textual":[76],"context,":[77],"only":[80],"input":[81],"for":[82,227],"this":[83,97,202],"extracted":[91,248],"from":[92,249],"pages.":[95],"In":[96],"paper,":[98],"propose":[100,209],"LIEGE,":[101],"first":[103],"general":[104],"framework":[105,240,265],"Link":[107],"web":[111],"best":[119],"our":[121,238,264],"knowledge.":[122],"Our":[123],"assumption":[124],"mentioned":[128,174],"be":[134],"any":[135],"collection":[136],"have":[140,147],"same":[142],"conceptual":[143],"type":[144],"people":[146],"mind.":[149],"To":[150],"annotate":[151],"items":[154],"they":[162],"likely":[163],"mention,":[164],"leverage":[166],"prior":[168],"probability":[169],"an":[171],"being":[173],"global":[177],"coherence":[178],"between":[179,190],"types":[181],"list.":[187],"The":[188],"interdependence":[189],"assignments":[193],"makes":[198],"optimization":[200],"problem":[205],"NP-hard.":[206],"Accordingly,":[207],"practical":[211],"solution":[212],"based":[213],"on":[214],"iterative":[216],"substitution":[217],"jointly":[219],"optimize":[220],"identification":[222],"mapping":[225],"items.":[231],"We":[232],"extensively":[233],"evaluated":[234],"performance":[236],"proposed":[239],"over":[241],"both":[242],"manually":[243],"annotated":[244],"pages":[252],"two":[254],"public":[255],"sets,":[257],"experimental":[260],"results":[261],"show":[262],"significantly":[266],"outperforms":[267],"baseline":[269],"method":[270],"terms":[272],"accuracy.":[274]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":10},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
