{"id":"https://openalex.org/W4387850605","doi":"https://doi.org/10.1007/978-981-99-7254-8_25","title":"Web Page Segmentation: A DOM-Structural Cohesion Analysis Approach","display_name":"Web Page Segmentation: A DOM-Structural Cohesion Analysis Approach","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4387850605","doi":"https://doi.org/10.1007/978-981-99-7254-8_25"},"language":"en","primary_location":{"id":"doi:10.1007/978-981-99-7254-8_25","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-981-99-7254-8_25","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-981-99-7254-8_25.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://link.springer.com/content/pdf/10.1007/978-981-99-7254-8_25.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008434740","display_name":"Hieu Huynh","orcid":"https://orcid.org/0000-0003-2310-1376"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Minh-Hieu Huynh","raw_affiliation_strings":["Katalon Inc., Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"Katalon Inc., Ho Chi Minh City, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102570410","display_name":"Quoc-Tri Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quoc-Tri Le","raw_affiliation_strings":["Katalon Inc., Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"Katalon Inc., Ho Chi Minh City, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055078097","display_name":"Loc Nguyen","orcid":"https://orcid.org/0000-0001-5192-8106"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]},{"id":"https://openalex.org/I23582244","display_name":"Ho Chi Minh City University of Science","ror":"https://ror.org/05jfbgm49","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023","https://openalex.org/I23582244"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Vu Nguyen","raw_affiliation_strings":["Katalon Inc., Ho Chi Minh City, Vietnam","University of Science, Ho Chi Minh City, Vietnam","Vietnam National University, Ho Chi Minh City, Vietnam"],"affiliations":[{"raw_affiliation_string":"Katalon Inc., Ho Chi Minh City, Vietnam","institution_ids":[]},{"raw_affiliation_string":"University of Science, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I23582244"]},{"raw_affiliation_string":"Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100709067","display_name":"Tien Nguyen","orcid":"https://orcid.org/0000-0002-4016-9164"},"institutions":[{"id":"https://openalex.org/I162577319","display_name":"The University of Texas at Dallas","ror":"https://ror.org/049emcs32","country_code":"US","type":"education","lineage":["https://openalex.org/I162577319"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tien Nguyen","raw_affiliation_strings":["Katalon Inc., Ho Chi Minh City, Vietnam","University of Texas at Dallas, Richardson, TX, USA"],"affiliations":[{"raw_affiliation_string":"Katalon Inc., Ho Chi Minh City, Vietnam","institution_ids":[]},{"raw_affiliation_string":"University of Texas at Dallas, Richardson, TX, USA","institution_ids":["https://openalex.org/I162577319"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008434740"],"corresponding_institution_ids":[],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":1.499,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.84805299,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"319","last_page":"333"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9708999991416931,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9139000177383423,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8646701574325562},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7911025285720825},{"id":"https://openalex.org/keywords/document-object-model","display_name":"Document Object Model","score":0.7276743054389954},{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.6295297145843506},{"id":"https://openalex.org/keywords/cohesion","display_name":"Cohesion (chemistry)","score":0.6278641223907471},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.6056965589523315},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5366560816764832},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.38739630579948425},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3861621916294098},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34192854166030884},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.22464877367019653}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8646701574325562},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7911025285720825},{"id":"https://openalex.org/C137922610","wikidata":"https://www.wikidata.org/wiki/Q2093","display_name":"Document Object Model","level":3,"score":0.7276743054389954},{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.6295297145843506},{"id":"https://openalex.org/C104054115","wikidata":"https://www.wikidata.org/wiki/Q216828","display_name":"Cohesion (chemistry)","level":2,"score":0.6278641223907471},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.6056965589523315},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5366560816764832},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.38739630579948425},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3861621916294098},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34192854166030884},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.22464877367019653},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-981-99-7254-8_25","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-981-99-7254-8_25","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-981-99-7254-8_25.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.1007/978-981-99-7254-8_25","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-981-99-7254-8_25","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-981-99-7254-8_25.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387850605.pdf","grobid_xml":"https://content.openalex.org/works/W4387850605.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W1566513354","https://openalex.org/W1965704641","https://openalex.org/W1989338554","https://openalex.org/W2004779840","https://openalex.org/W2020254000","https://openalex.org/W2040075907","https://openalex.org/W2072489225","https://openalex.org/W2084358158","https://openalex.org/W2093436348","https://openalex.org/W2095289676","https://openalex.org/W2100184871","https://openalex.org/W2127847352","https://openalex.org/W2145023731","https://openalex.org/W2145349611","https://openalex.org/W2152818382","https://openalex.org/W2400661088","https://openalex.org/W2493109812","https://openalex.org/W2785494106","https://openalex.org/W2957505564","https://openalex.org/W2963849369","https://openalex.org/W3094448412","https://openalex.org/W3142760838","https://openalex.org/W3210529140","https://openalex.org/W4206845400","https://openalex.org/W4241588219"],"related_works":["https://openalex.org/W4385695127","https://openalex.org/W2031790754","https://openalex.org/W2373402338","https://openalex.org/W3144508074","https://openalex.org/W2951920527","https://openalex.org/W2076910790","https://openalex.org/W2155199173","https://openalex.org/W2275993472","https://openalex.org/W2998827288","https://openalex.org/W43181213"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
