{"id":"https://openalex.org/W151043533","doi":"https://doi.org/10.1007/978-3-642-33308-8_4","title":"Generating Xpath Expressions for Structured Web Data Record Segmentation","display_name":"Generating Xpath Expressions for Structured Web Data Record Segmentation","publication_year":2012,"publication_date":"2012-01-01","ids":{"openalex":"https://openalex.org/W151043533","doi":"https://doi.org/10.1007/978-3-642-33308-8_4","mag":"151043533"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-642-33308-8_4","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-33308-8_4","pdf_url":null,"source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064548188","display_name":"Tomas Grigalis","orcid":null},"institutions":[{"id":"https://openalex.org/I167420956","display_name":"Vilnius Gediminas Technical University","ror":"https://ror.org/02x3e4q36","country_code":"LT","type":"education","lineage":["https://openalex.org/I167420956"]}],"countries":["LT"],"is_corresponding":true,"raw_author_name":"Tomas Grigalis","raw_affiliation_strings":["Department of Information Systems, Vilnius Gediminas Technical University, Vilnius, Lithuania"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, Vilnius Gediminas Technical University, Vilnius, Lithuania","institution_ids":["https://openalex.org/I167420956"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062980566","display_name":"Antanas \u010cenys","orcid":"https://orcid.org/0000-0002-0208-7176"},"institutions":[{"id":"https://openalex.org/I167420956","display_name":"Vilnius Gediminas Technical University","ror":"https://ror.org/02x3e4q36","country_code":"LT","type":"education","lineage":["https://openalex.org/I167420956"]}],"countries":["LT"],"is_corresponding":false,"raw_author_name":"Antanas \u010cenys","raw_affiliation_strings":["Department of Information Systems, Vilnius Gediminas Technical University, Vilnius, Lithuania"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, Vilnius Gediminas Technical University, Vilnius, Lithuania","institution_ids":["https://openalex.org/I167420956"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5064548188"],"corresponding_institution_ids":["https://openalex.org/I167420956"],"apc_list":null,"apc_paid":null,"fwci":0.6088,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.67246587,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"38","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9847999811172485,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13976","display_name":"Web visibility and informetrics","score":0.9562000036239624,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8296995162963867},{"id":"https://openalex.org/keywords/xpath","display_name":"XPath","score":0.7690829038619995},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6526810526847839},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6344648003578186},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5635611414909363},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5572190284729004},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.46154123544692993},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.4554755687713623},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4258367717266083},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41377830505371094},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2755866050720215},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.243859201669693},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.20300549268722534},{"id":"https://openalex.org/keywords/xml-database","display_name":"XML database","score":0.07570019364356995}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8296995162963867},{"id":"https://openalex.org/C2780213375","wikidata":"https://www.wikidata.org/wiki/Q16340","display_name":"XPath","level":4,"score":0.7690829038619995},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6526810526847839},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6344648003578186},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5635611414909363},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5572190284729004},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.46154123544692993},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.4554755687713623},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4258367717266083},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41377830505371094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2755866050720215},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.243859201669693},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.20300549268722534},{"id":"https://openalex.org/C183068750","wikidata":"https://www.wikidata.org/wiki/Q357393","display_name":"XML database","level":3,"score":0.07570019364356995},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-642-33308-8_4","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-33308-8_4","pdf_url":null,"source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W104909239","https://openalex.org/W1553019137","https://openalex.org/W1803802947","https://openalex.org/W2022158118","https://openalex.org/W2040757233","https://openalex.org/W2049461910","https://openalex.org/W2104086170","https://openalex.org/W2108223890","https://openalex.org/W2128341918","https://openalex.org/W2139599797","https://openalex.org/W2143309843","https://openalex.org/W2148210463","https://openalex.org/W2157160236","https://openalex.org/W2160189941","https://openalex.org/W2247412337","https://openalex.org/W4230980612","https://openalex.org/W4239866631","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W1542110834","https://openalex.org/W2611888112","https://openalex.org/W2121120069","https://openalex.org/W562932586","https://openalex.org/W2124793519","https://openalex.org/W2398280235","https://openalex.org/W2184735843","https://openalex.org/W2355446901","https://openalex.org/W1994081385","https://openalex.org/W2072289174"],"abstract_inverted_index":null,"counts_by_year":[{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
