{"id":"https://openalex.org/W2132422204","doi":"https://doi.org/10.1109/icmlc.2011.6016959","title":"A peer-to-peer based passive web crawling system","display_name":"A peer-to-peer based passive web crawling system","publication_year":2011,"publication_date":"2011-07-01","ids":{"openalex":"https://openalex.org/W2132422204","doi":"https://doi.org/10.1109/icmlc.2011.6016959","mag":"2132422204"},"language":"en","primary_location":{"id":"doi:10.1109/icmlc.2011.6016959","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmlc.2011.6016959","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 International Conference on Machine Learning and Cybernetics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110477928","display_name":"Qingcai Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qing-Cai Chen","raw_affiliation_strings":["Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#","institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102206534","display_name":"Xiaohong Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao-Hong Yang","raw_affiliation_strings":["Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#","institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100424254","display_name":"Xiaolong Wang","orcid":"https://orcid.org/0000-0001-9003-4252"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao-Long Wang","raw_affiliation_strings":["Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China#TAB#","institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110477928"],"corresponding_institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.17370078,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"1878","last_page":"1883"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.9506456851959229},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.791975200176239},{"id":"https://openalex.org/keywords/focused-crawler","display_name":"Focused crawler","score":0.7753322124481201},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.6881054043769836},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.6263978481292725},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.59120774269104},{"id":"https://openalex.org/keywords/web-server","display_name":"Web server","score":0.5746637582778931},{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.5727197527885437},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.5534402132034302},{"id":"https://openalex.org/keywords/web-search-engine","display_name":"Web search engine","score":0.4952644407749176},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.47813737392425537},{"id":"https://openalex.org/keywords/static-web-page","display_name":"Static web page","score":0.41224658489227295},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3774062395095825},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.3665505647659302},{"id":"https://openalex.org/keywords/web-navigation","display_name":"Web navigation","score":0.28961554169654846}],"concepts":[{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.9506456851959229},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.791975200176239},{"id":"https://openalex.org/C73340581","wikidata":"https://www.wikidata.org/wiki/Q5463958","display_name":"Focused crawler","level":5,"score":0.7753322124481201},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.6881054043769836},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.6263978481292725},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.59120774269104},{"id":"https://openalex.org/C11392498","wikidata":"https://www.wikidata.org/wiki/Q11288","display_name":"Web server","level":3,"score":0.5746637582778931},{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.5727197527885437},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.5534402132034302},{"id":"https://openalex.org/C521815418","wikidata":"https://www.wikidata.org/wiki/Q4182287","display_name":"Web search engine","level":4,"score":0.4952644407749176},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.47813737392425537},{"id":"https://openalex.org/C173576120","wikidata":"https://www.wikidata.org/wiki/Q2641220","display_name":"Static web page","level":4,"score":0.41224658489227295},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3774062395095825},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.3665505647659302},{"id":"https://openalex.org/C61096286","wikidata":"https://www.wikidata.org/wiki/Q7978592","display_name":"Web navigation","level":3,"score":0.28961554169654846},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmlc.2011.6016959","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmlc.2011.6016959","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 International Conference on Machine Learning and Cybernetics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.5199999809265137}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W75458008","https://openalex.org/W1566984846","https://openalex.org/W1613836731","https://openalex.org/W1674850363","https://openalex.org/W1761577731","https://openalex.org/W2007687650","https://openalex.org/W2029500199","https://openalex.org/W2038378248","https://openalex.org/W2045998703","https://openalex.org/W2066636486","https://openalex.org/W2098660810","https://openalex.org/W2130242957","https://openalex.org/W2145990704","https://openalex.org/W2158418010","https://openalex.org/W4285719527","https://openalex.org/W6634031162","https://openalex.org/W6638063638","https://openalex.org/W6679115375"],"related_works":["https://openalex.org/W2095543197","https://openalex.org/W2402678663","https://openalex.org/W3201526811","https://openalex.org/W4200125296","https://openalex.org/W2379145789","https://openalex.org/W1994958611","https://openalex.org/W2610451498","https://openalex.org/W2277785728","https://openalex.org/W2109463504","https://openalex.org/W3199173531"],"abstract_inverted_index":{"Though":[0],"the":[1,13,54,87,100,121,124,135,152,162,168,179,189,204],"commercial":[2],"success":[3],"of":[4,15,39,76,148,154,164,170,181],"search":[5,88],"engines":[6],"and":[7,29,80,90,102,111,178,187,201],"large":[8,21,172],"scale":[9],"web":[10,56,70,142,157],"page":[11,16],"crawlers,":[12,123],"problems":[14,52],"refresh,":[17],"new":[18],"URL":[19],"discovering,":[20],"file":[22],"downloading,":[23],"distributed":[24],"multimedia":[25,175],"content":[26,176],"feature":[27],"extracting":[28],"indexing":[30,186],"etc.":[31],"are":[32],"still":[33],"open.":[34],"The":[35,94,145],"independent":[36],"working":[37],"behavior":[38],"each":[40],"crawler":[41,57,78,82,95,117,136],"makes":[42],"it":[43],"very":[44],"hard":[45],"to":[46,99,109],"seek":[47],"solutions":[48],"for":[49,134,159,203],"all":[50],"these":[51,61],"under":[53],"classical":[55,122],"architecture.":[58],"To":[59],"address":[60],"problems,":[62],"this":[63,138,149],"paper":[64],"proposes":[65],"an":[66],"innovative":[67],"client/server":[68],"based":[69],"crawling":[71,143],"system.":[72,144],"This":[73],"system":[74,150,197],"consists":[75],"a":[77,81,105,131,140,160,195],"server":[79,96],"client":[83,101],"which":[84],"work":[85],"in":[86],"engine":[89],"website":[91,165],"end":[92],"respectively.":[93],"registers":[97],"itself":[98],"joins":[103],"into":[104],"temporary":[106],"peer-to-peer":[107],"network":[108],"cooperate":[110],"share":[112],"downloaded":[113],"data":[114,125],"with":[115],"other":[116],"servers.":[118],"Different":[119],"from":[120],"downloading":[126,171],"procedure":[127],"is":[128,139],"initialized":[129],"by":[130],"client.":[132],"So":[133],"server,":[137],"\u201cpassive\u201d":[141],"main":[146],"benefits":[147],"include":[151],"capability":[153,169,180],"timely":[155],"management":[156],"changes":[158],"crawler,":[161],"saving":[163],"bandwidth":[166],"resources,":[167],"files":[173],"or":[174],"features,":[177],"protection":[182],"intellectual":[183],"properties":[184],"while":[185],"searching":[188],"content.":[190],"Our":[191],"experiments":[192],"taken":[193],"on":[194],"simulation":[196],"show":[198],"its":[199],"efficiency":[200],"practicability":[202],"real":[205],"Internet":[206],"environments.":[207]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
