{"id":"https://openalex.org/W4408197460","doi":"https://doi.org/10.1007/978-3-031-85960-1_9","title":"Web Crawl Refusals: Insights From Common Crawl","display_name":"Web Crawl Refusals: Insights From Common Crawl","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408197460","doi":"https://doi.org/10.1007/978-3-031-85960-1_9"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-031-85960-1_9","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-85960-1_9","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.utwente.nl/en/publications/bb2d7d75-9bd1-41d4-865e-c98a06cf5683","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116539053","display_name":"Mostafa Ansar","orcid":null},"institutions":[{"id":"https://openalex.org/I94624287","display_name":"University of Twente","ror":"https://ror.org/006hf6230","country_code":"NL","type":"education","lineage":["https://openalex.org/I94624287"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Mostafa Ansar","raw_affiliation_strings":["University of Twente, Enschede, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Twente, Enschede, The Netherlands","institution_ids":["https://openalex.org/I94624287"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025537461","display_name":"Anna Sperotto","orcid":"https://orcid.org/0000-0002-9481-5846"},"institutions":[{"id":"https://openalex.org/I94624287","display_name":"University of Twente","ror":"https://ror.org/006hf6230","country_code":"NL","type":"education","lineage":["https://openalex.org/I94624287"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Anna Sperotto","raw_affiliation_strings":["University of Twente, Enschede, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Twente, Enschede, The Netherlands","institution_ids":["https://openalex.org/I94624287"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005480813","display_name":"Ralph Holz","orcid":"https://orcid.org/0000-0001-9614-2377"},"institutions":[{"id":"https://openalex.org/I22465464","display_name":"University of M\u00fcnster","ror":"https://ror.org/00pd74e08","country_code":"DE","type":"education","lineage":["https://openalex.org/I22465464"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Ralph Holz","raw_affiliation_strings":["University of M\u00fcnster, M\u00fcnster, Germany"],"affiliations":[{"raw_affiliation_string":"University of M\u00fcnster, M\u00fcnster, Germany","institution_ids":["https://openalex.org/I22465464"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5116539053"],"corresponding_institution_ids":["https://openalex.org/I94624287"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13610432,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"197","last_page":"214"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11598","display_name":"Internet Traffic Analysis and Secure E-voting","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8013643026351929},{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.5135317444801331},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4480663537979126},{"id":"https://openalex.org/keywords/web-application","display_name":"Web application","score":0.4180350601673126},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3756892681121826},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.359613835811615}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8013643026351929},{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.5135317444801331},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4480663537979126},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.4180350601673126},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3756892681121826},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.359613835811615}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/978-3-031-85960-1_9","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-031-85960-1_9","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:ris.utwente.nl:openaire/bb2d7d75-9bd1-41d4-865e-c98a06cf5683","is_oa":true,"landing_page_url":"https://research.utwente.nl/en/publications/bb2d7d75-9bd1-41d4-865e-c98a06cf5683","pdf_url":null,"source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ansar, M, Sperotto, A & Holz, R 2025, Web Crawl Refusals : Insights From Common Crawl. in C Testart, R van Rijswijk-Deij & B Stiller (eds), Passive and Active Measurement : 26th International Conference, PAM 2025, Virtual Event, March 10\u201312, 2025, Proceedings. Lecture Notes in Computer Science, vol. 15567, Springer, Cham, pp. 197\u2013214, 26th International Conference on Passive and Active Measurement, PAM 2025, Virtual, Online, 10/03/25. https://doi.org/10.1007/978-3-031-85960-1_9","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:ris.utwente.nl:openaire/bb2d7d75-9bd1-41d4-865e-c98a06cf5683","is_oa":true,"landing_page_url":"https://research.utwente.nl/en/publications/bb2d7d75-9bd1-41d4-865e-c98a06cf5683","pdf_url":null,"source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ansar, M, Sperotto, A & Holz, R 2025, Web Crawl Refusals : Insights From Common Crawl. in C Testart, R van Rijswijk-Deij & B Stiller (eds), Passive and Active Measurement : 26th International Conference, PAM 2025, Virtual Event, March 10\u201312, 2025, Proceedings. Lecture Notes in Computer Science, vol. 15567, Springer, Cham, pp. 197\u2013214, 26th International Conference on Passive and Active Measurement, PAM 2025, Virtual, Online, 10/03/25. https://doi.org/10.1007/978-3-031-85960-1_9","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.5600000023841858}],"awards":[{"id":"https://openalex.org/G4002167081","display_name":null,"funder_award_id":"NWA.1215.18.003","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"},{"id":"https://openalex.org/G629491556","display_name":null,"funder_award_id":"(NWO)","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2130867912","https://openalex.org/W2144489971","https://openalex.org/W2184765589","https://openalex.org/W2424402128","https://openalex.org/W2796214649","https://openalex.org/W2902341081","https://openalex.org/W2955221586","https://openalex.org/W3004148183","https://openalex.org/W3012679427","https://openalex.org/W3015863761","https://openalex.org/W3093603548","https://openalex.org/W4256444741","https://openalex.org/W4281737183"],"related_works":["https://openalex.org/W2152505903","https://openalex.org/W2054759010","https://openalex.org/W3202833648","https://openalex.org/W2066301148","https://openalex.org/W2626977282","https://openalex.org/W2566625334","https://openalex.org/W2733224566","https://openalex.org/W3182846679","https://openalex.org/W2081888991","https://openalex.org/W3014696621"],"abstract_inverted_index":null,"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
