{"id":"https://openalex.org/W2289993248","doi":"https://doi.org/10.32657/10356/35745","title":"Mining evolution of structure of semi-structured web data","display_name":"Mining evolution of structure of semi-structured web data","publication_year":2007,"publication_date":"2007-01-01","ids":{"openalex":"https://openalex.org/W2289993248","doi":"https://doi.org/10.32657/10356/35745","mag":"2289993248"},"language":"en","primary_location":{"id":"doi:10.32657/10356/35745","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/35745","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/35745/2/ZhaoQiankun07.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},"type":"dissertation","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/35745/2/ZhaoQiankun07.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075130969","display_name":"Qiankun Zhao","orcid":"https://orcid.org/0000-0001-7804-0430"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Qiankun Zhao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5075130969"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9664999842643738,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9254000186920166,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4899093508720398},{"id":"https://openalex.org/keywords/semi-structured-data","display_name":"Semi-structured data","score":0.43898528814315796},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.43089744448661804},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3883715271949768}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4899093508720398},{"id":"https://openalex.org/C40077939","wikidata":"https://www.wikidata.org/wiki/Q2336004","display_name":"Semi-structured data","level":3,"score":0.43898528814315796},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.43089744448661804},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3883715271949768},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.32657/10356/35745","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/35745","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/35745/2/ZhaoQiankun07.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/35745","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/35745","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Thesis"},{"id":"pmh:oai:uilis.unsyiah.ac.id:19435","is_oa":false,"landing_page_url":"http://hdl.handle.net/10356/35745","pdf_url":null,"source":{"id":"https://openalex.org/S4377196378","display_name":"UPT. Syiah Kuala University Library (Syiah Kuala University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I187494767","host_organization_name":"Universitas Syiah Kuala","host_organization_lineage":["https://openalex.org/I187494767"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Thesis"}],"best_oa_location":{"id":"doi:10.32657/10356/35745","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/35745","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/35745/2/ZhaoQiankun07.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},"sustainable_development_goals":[{"score":0.5400000214576721,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2289993248.pdf","grobid_xml":"https://content.openalex.org/works/W2289993248.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2529935843","https://openalex.org/W2005624112"],"abstract_inverted_index":{"Web":[0,32,39,52,69,81,98,106],"mining":[1,40,64],"is":[2,56,83],"a":[3],"converging":[4],"research":[5,9,26,59],"area":[6],"from":[7,105],"several":[8],"communities,":[10],"such":[11,91],"as":[12,92],"database,":[13],"information":[14],"retrieval,":[15],"machine":[16],"learning":[17],"and":[18,47,86,102],"natural":[19],"language":[20],"processing.":[21],"In":[22],"the":[23,45,48,65,77],"literature,":[24],"many":[25,89],"efforts":[27],"have":[28],"been":[29],"directed":[30],"to":[31],"mining.":[33],"However,":[34],"we":[35],"observed":[36],"that":[37,60,73],"existing":[38],"approaches":[41],"mainly":[42],"focused":[43],"on":[44],"semi-structured":[46],"massiveness":[49],"properties":[50],"of":[51,68,80],"data,":[53],"whereas":[54],"there":[55],"no":[57],"systematic":[58],"discovers":[61],"knowledge":[62,74],"by":[63],"dynamic":[66,78],"property":[67],"data.":[70,107],"We":[71],"believe":[72],"hidden":[75],"behind":[76],"nature":[79],"data":[82],"also":[84],"important":[85],"useful":[87],"in":[88],"applications":[90],"dynamic-conscious":[93],"XML":[94],"cache":[95],"strategy,":[96],"intelligent":[97],"advertisement":[99],"placing":[100],"scheme,":[101],"event":[103],"detection":[104]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
