{"id":"https://openalex.org/W2012297991","doi":"https://doi.org/10.4304/jcp.5.11.1646-1654","title":"Exploiting Location-aware Mechanism for Distributed Web Crawling over DHTs","display_name":"Exploiting Location-aware Mechanism for Distributed Web Crawling over DHTs","publication_year":2010,"publication_date":"2010-11-01","ids":{"openalex":"https://openalex.org/W2012297991","doi":"https://doi.org/10.4304/jcp.5.11.1646-1654","mag":"2012297991"},"language":"en","primary_location":{"id":"doi:10.4304/jcp.5.11.1646-1654","is_oa":false,"landing_page_url":"https://doi.org/10.4304/jcp.5.11.1646-1654","pdf_url":null,"source":{"id":"https://openalex.org/S77894049","display_name":"Journal of Computers","issn_l":"1796-203X","issn":["1796-203X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318660","host_organization_name":"Academy Publisher","host_organization_lineage":["https://openalex.org/P4310318660"],"host_organization_lineage_names":["Academy Publisher"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100319784","display_name":"Xu Xiao\ue00b","orcid":"https://orcid.org/0000-0001-5774-1094"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xiao Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085221201","display_name":"Weizhe Zhang","orcid":"https://orcid.org/0000-0003-4783-876X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weizhe Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100417312","display_name":"Hongli Zhang","orcid":"https://orcid.org/0000-0002-8167-7106"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongli Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5113587199","display_name":"Binxing Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Binxing Fang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100319784"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.12397104,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"5","issue":"11","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.8741768002510071},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8018496036529541},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.6366611123085022},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.42278552055358887},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.34591615200042725},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.07254469394683838}],"concepts":[{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.8741768002510071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8018496036529541},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.6366611123085022},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.42278552055358887},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.34591615200042725},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07254469394683838},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.4304/jcp.5.11.1646-1654","is_oa":false,"landing_page_url":"https://doi.org/10.4304/jcp.5.11.1646-1654","pdf_url":null,"source":{"id":"https://openalex.org/S77894049","display_name":"Journal of Computers","issn_l":"1796-203X","issn":["1796-203X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318660","host_organization_name":"Academy Publisher","host_organization_lineage":["https://openalex.org/P4310318660"],"host_organization_lineage_names":["Academy Publisher"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6399999856948853}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W71185953","https://openalex.org/W77011704","https://openalex.org/W134713352","https://openalex.org/W141905930","https://openalex.org/W1526112125","https://openalex.org/W1613836731","https://openalex.org/W1758648065","https://openalex.org/W1761577731","https://openalex.org/W2000273502","https://openalex.org/W2006115592","https://openalex.org/W2020765652","https://openalex.org/W2059302649","https://openalex.org/W2066636486","https://openalex.org/W2104417748","https://openalex.org/W2106532810","https://openalex.org/W2117311042","https://openalex.org/W2127441060","https://openalex.org/W2132051999","https://openalex.org/W2133843880","https://openalex.org/W2134261469","https://openalex.org/W2150064865","https://openalex.org/W2158049821","https://openalex.org/W2159692093","https://openalex.org/W2163059190","https://openalex.org/W2168905685","https://openalex.org/W2295141584"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4321258516","https://openalex.org/W2051833850","https://openalex.org/W914962000","https://openalex.org/W2159872134","https://openalex.org/W4299833833","https://openalex.org/W2795447506","https://openalex.org/W2152505903","https://openalex.org/W2963942219"],"abstract_inverted_index":{"Inspired":[0],"by":[1,59,163],"the":[2,16,19,34,38,46,49,54,61,67,80,90,97,155,165],"concept":[3],"of":[4,18,37,48,70,88,157],"internet":[5],"computing,":[6],"DHT-based":[7,120],"distributed":[8,115,121],"Web":[9,21,39,116,122],"crawling":[10,22,40,123],"model":[11,124],"is":[12,57,125,140,160],"proposed":[13,126,141],"to":[14,32,44,108],"solve":[15],"bottlenecks":[17],"traditional":[20],"systems.":[23],"Based":[24],"on":[25,53,96,103,136],"this":[26,130],"system":[27],"model,":[28,131],"we":[29],"propose":[30],"optimizations":[31],"reduce":[33],"download":[35,55],"time":[36,56],"tasks":[41],"in":[42,147],"order":[43],"increase":[45],"efficiency":[47],"system.":[50],"The":[51],"improvement":[52],"achieved":[58],"shortening":[60],"crawler-crawlee":[62,148],"network":[63],"distance.":[64],"By":[65],"utilizing":[66],"mapping":[68],"mechanism":[69],"Content":[71],"Addressable":[72],"Network":[73,76],"(CAN)":[74],"over":[75],"Coordinate":[77],"System":[78],"(NC),":[79],"issue":[81,156],"can":[82],"be":[83],"mapped":[84],"onto":[85],"a":[86,132,144],"problem":[87],"minimizing":[89],"distances":[91],"between":[92],"peers":[93],"and":[94],"resources":[95],"DHT":[98],"overlay.":[99],"This":[100],"paper":[101],"focuses":[102],"reducing":[104],"such":[105],"distances,":[106],"seeking":[107],"provide":[109],"an":[110],"improved":[111],"location-aware":[112],"infrastructure":[113],"for":[114],"crawling.":[117],"A":[118],"new":[119,133,166],"first.":[127],"Then,":[128],"under":[129],"method":[134,167],"based":[135],"CAN\u2019s":[137],"splitting":[138],"schemes":[139],"which":[142],"shows":[143],"significant":[145],"decrease":[146],"distance":[149],"against":[150],"existing":[151],"schemes.":[152],"In":[153],"addition,":[154],"load":[158],"balancing":[159],"also":[161],"solved":[162],"combining":[164],"with":[168],"old":[169],"ones.":[170]},"counts_by_year":[{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
