{"id":"https://openalex.org/W2139423731","doi":"https://doi.org/10.1145/2516633.2516638","title":"The parallel path framework for entity discovery on the web","display_name":"The parallel path framework for entity discovery on the web","publication_year":2013,"publication_date":"2013-09-01","ids":{"openalex":"https://openalex.org/W2139423731","doi":"https://doi.org/10.1145/2516633.2516638","mag":"2139423731"},"language":"en","primary_location":{"id":"doi:10.1145/2516633.2516638","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2516633.2516638","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084597959","display_name":"Tim Weninger","orcid":"https://orcid.org/0000-0003-3164-2615"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tim Weninger","raw_affiliation_strings":["University of Illinois at Urbana-Champaign","University of Illinois at Urbana Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110622330","display_name":"Thomas J. Johnston","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas J. Johnston","raw_affiliation_strings":["University of Illinois at Urbana-Champaign","University of Illinois at Urbana Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103750286","display_name":"Jiawei Han","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiawei Han","raw_affiliation_strings":["University of Illinois at Urbana-Champaign","University of Illinois at Urbana Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana Champaign","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5084597959"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":2.4269,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.91523934,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"7","issue":"3","first_page":"1","last_page":"29"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13976","display_name":"Web visibility and informetrics","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9783999919891357,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8236890435218811},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.6525033116340637},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.6068350076675415},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5853854417800903},{"id":"https://openalex.org/keywords/static-web-page","display_name":"Static web page","score":0.5293465256690979},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4517967402935028},{"id":"https://openalex.org/keywords/web-mining","display_name":"Web mining","score":0.42503926157951355},{"id":"https://openalex.org/keywords/web-navigation","display_name":"Web navigation","score":0.28090065717697144}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8236890435218811},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.6525033116340637},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.6068350076675415},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5853854417800903},{"id":"https://openalex.org/C173576120","wikidata":"https://www.wikidata.org/wiki/Q2641220","display_name":"Static web page","level":4,"score":0.5293465256690979},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4517967402935028},{"id":"https://openalex.org/C197046077","wikidata":"https://www.wikidata.org/wiki/Q785337","display_name":"Web mining","level":3,"score":0.42503926157951355},{"id":"https://openalex.org/C61096286","wikidata":"https://www.wikidata.org/wiki/Q7978592","display_name":"Web navigation","level":3,"score":0.28090065717697144},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2516633.2516638","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2516633.2516638","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4399999976158142,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332467","display_name":"U.S. Air Force","ror":"https://ror.org/006gmme17"},{"id":"https://openalex.org/F4320337389","display_name":"Division of Information and Intelligent Systems","ror":"https://ror.org/053a2cp42"},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W140787242","https://openalex.org/W1489843519","https://openalex.org/W1965605976","https://openalex.org/W1988623849","https://openalex.org/W2004227778","https://openalex.org/W2005207065","https://openalex.org/W2011282943","https://openalex.org/W2015551056","https://openalex.org/W2024129947","https://openalex.org/W2036100275","https://openalex.org/W2049048440","https://openalex.org/W2049365470","https://openalex.org/W2059586463","https://openalex.org/W2075100598","https://openalex.org/W2088179629","https://openalex.org/W2092590954","https://openalex.org/W2096496923","https://openalex.org/W2102189859","https://openalex.org/W2104086170","https://openalex.org/W2108126629","https://openalex.org/W2108223890","https://openalex.org/W2111869785","https://openalex.org/W2117510361","https://openalex.org/W2128549493","https://openalex.org/W2140116426","https://openalex.org/W2143519641","https://openalex.org/W2145007893","https://openalex.org/W2146001804","https://openalex.org/W2153466602","https://openalex.org/W2153642258","https://openalex.org/W2156772624","https://openalex.org/W2160189941","https://openalex.org/W2167894050","https://openalex.org/W2168358004","https://openalex.org/W2170188121","https://openalex.org/W2171364811","https://openalex.org/W2284650288","https://openalex.org/W4240555197"],"related_works":["https://openalex.org/W1979144454","https://openalex.org/W2069679074","https://openalex.org/W4239898202","https://openalex.org/W3116613346","https://openalex.org/W1559090489","https://openalex.org/W2168047402","https://openalex.org/W2115253914","https://openalex.org/W2316185946","https://openalex.org/W2000745862","https://openalex.org/W2376574812"],"abstract_inverted_index":{"It":[0],"has":[1],"been":[2],"a":[3,52,99,110,164,210],"dream":[4],"of":[5,16,26,45,60,105,129,132,147,206],"the":[6,13,17,22,27,43,56,79,85,106,130,133,141,148,174,204],"database":[7,28],"and":[8,58,81,101,113,119,177,180,199],"Web":[9,20,38,86,90,111,165,175],"communities":[10],"to":[11,36,68,87,98,126],"reconcile":[12],"unstructured":[14],"nature":[15],"World":[18],"Wide":[19],"with":[21,209],"neat,":[23],"structured":[24],"schemas":[25,44],"paradigm.":[29],"Even":[30],"though":[31],"databases":[32,47],"are":[33,48],"currently":[34],"used":[35],"generate":[37],"content":[39],"in":[40,140],"some":[41],"sites,":[42],"these":[46,191],"rarely":[49],"consistent":[50],"across":[51],"domain.":[53],"This":[54],"makes":[55],"comparison":[57],"aggregation":[59],"information":[61,83,184],"from":[62],"different":[63],"domains":[64],"difficult.":[65],"We":[66,186],"aim":[67],"make":[69],"an":[70,114],"important":[71],"step":[72],"towards":[73],"resolving":[74],"this":[75],"disparity":[76],"by":[77,189],"using":[78],"structural":[80],"relational":[82],"on":[84],"(1)":[88],"extract":[89,103],"lists,":[91],"(2)":[92],"find":[93,127],"entity-pages,":[94],"(3)":[95],"map":[96],"entity-pages":[97,131,198],"database,":[100],"(4)":[102],"attributes":[104,146],"entities.":[107],"Specifically,":[108],"given":[109],"site":[112],"entity-page":[115],"(e.g.,":[116,136,151],"university":[117],"department":[118],"faculty":[120,138],"member":[121],"home":[122],"page)":[123],"we":[124,162,194,202],"seek":[125],"all":[128,137],"same":[134],"type":[135],"members":[139],"department),":[142],"as":[143,145],"well":[144],"specific":[149],"entities":[150],"their":[152],"phone":[153],"numbers,":[154],"email":[155],"addresses,":[156],"office":[157],"numbers).":[158],"To":[159],"do":[160],"this,":[161],"propose":[163],"structure":[166],"mining":[167],"method":[168,208],"which":[169],"grows":[170],"parallel":[171,192],"paths":[172,193],"through":[173],"graph":[176],"DOM":[178],"trees":[179],"propagates":[181],"relevant":[182],"attribute":[183],"forward.":[185],"show":[187],"that":[188],"utilizing":[190],"can":[195],"efficiently":[196],"discover":[197],"attributes.":[200],"Finally,":[201],"demonstrate":[203],"accuracy":[205],"our":[207],"large":[211],"case":[212],"study.":[213]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
