{"id":"https://openalex.org/W2157243877","doi":"https://doi.org/10.1109/icitst.2009.5402623","title":"The website census","display_name":"The website census","publication_year":2009,"publication_date":"2009-11-01","ids":{"openalex":"https://openalex.org/W2157243877","doi":"https://doi.org/10.1109/icitst.2009.5402623","mag":"2157243877"},"language":"en","primary_location":{"id":"doi:10.1109/icitst.2009.5402623","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icitst.2009.5402623","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 International Conference for Internet Technology and Secured Transactions, (ICITST)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034136108","display_name":"Abdul Qadeer","orcid":"https://orcid.org/0000-0002-0268-1167"},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"A. Qadeer","raw_affiliation_strings":["Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan"],"affiliations":[{"raw_affiliation_string":"Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101856571","display_name":"Waqar Mahmood","orcid":"https://orcid.org/0009-0001-6471-8420"},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"W. Mahmood","raw_affiliation_strings":["Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan"],"affiliations":[{"raw_affiliation_string":"Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101836532","display_name":"Abdul Waheed","orcid":"https://orcid.org/0000-0001-9929-6574"},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"A. Waheed","raw_affiliation_strings":["Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan"],"affiliations":[{"raw_affiliation_string":"Al-Khawarizmi Institute of Computer Science, University of Engineering and Technology, Lahore, Pakistan","institution_ids":["https://openalex.org/I142732210"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5034136108"],"corresponding_institution_ids":["https://openalex.org/I142732210"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17379804,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9550999999046326,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.9423107504844666},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7678365707397461},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.5926304459571838},{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.5004804134368896},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.4537884593009949},{"id":"https://openalex.org/keywords/web-server","display_name":"Web server","score":0.4350751042366028},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.4207325577735901},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.411689817905426},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.39156636595726013},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.15392065048217773}],"concepts":[{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.9423107504844666},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7678365707397461},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5926304459571838},{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.5004804134368896},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.4537884593009949},{"id":"https://openalex.org/C11392498","wikidata":"https://www.wikidata.org/wiki/Q11288","display_name":"Web server","level":3,"score":0.4350751042366028},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.4207325577735901},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.411689817905426},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.39156636595726013},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.15392065048217773},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icitst.2009.5402623","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icitst.2009.5402623","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 International Conference for Internet Technology and Secured Transactions, (ICITST)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2067117154","https://openalex.org/W2122269925","https://openalex.org/W2129620481"],"related_works":["https://openalex.org/W2566658409","https://openalex.org/W3119324922","https://openalex.org/W2352686120","https://openalex.org/W2372594123","https://openalex.org/W2358310581","https://openalex.org/W2964752624","https://openalex.org/W2026132847","https://openalex.org/W2137810919","https://openalex.org/W4385695127","https://openalex.org/W2097808084"],"abstract_inverted_index":{"The":[0,46,124],"website":[1,26],"census":[2],"is":[3,21,29,105,110,127],"an":[4],"effort":[5],"to":[6,90,128,134,142],"enumerate":[7],"all":[8],"the":[9,12,33,37,40,78,92,135],"websites":[10,120],"on":[11,98],"World":[13],"Wide":[14],"Web":[15],"(WWW)":[16],"without":[17],"using":[18],"crawling.":[19,137,155],"Crawling":[20],"a":[22,51,56,66,74,95,132,146],"traditional":[23],"way":[24],"of":[25,36,49,60,69,77,94,114,119],"discovery.":[27],"It":[28,138],"conceptually":[30],"simple":[31],"but":[32],"very":[34],"size":[35],"WWW":[38],"makes":[39],"implementation":[41],"complex":[42,67],"and":[43,65],"resource":[44,115],"demanding.":[45],"enormous":[47],"amount":[48],"bandwidth,":[50],"huge":[52],"persistent":[53],"storage":[54],"pool,":[55],"sufficiently":[57],"large":[58],"cluster":[59],"machines":[61],"for":[62,153],"data":[63],"processing":[64],"set":[68],"software":[70],"systems":[71],"are":[72],"just":[73],"few":[75],"examples":[76],"needed":[79],"resources.":[80],"In":[81],"this":[82,103],"work,":[83],"we":[84],"use":[85,129],"exhaustive":[86,106],"IP":[87],"range":[88],"probing":[89,104],"detect":[91],"presence":[93],"web":[96],"server":[97],"TCP":[99],"port":[100],"80.":[101],"Although":[102],"in":[107,112],"nature,":[108],"it":[109,130],"lightweight":[111],"terms":[113],"demands.":[116],"This":[117],"enumeration":[118],"has":[121],"many":[122],"applications.":[123],"most":[125],"obvious":[126],"as":[131,145],"seed":[133,152],"conventional":[136],"can":[139],"be":[140,143],"refined":[141],"used":[144],"top":[147],"level":[148],"domain":[149],"(TLD)":[150],"specific":[151],"targeted":[154]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
