{"id":"https://openalex.org/W2027019938","doi":"https://doi.org/10.1145/1670598.1670617","title":"Content and structure summarisation for accessing XML documents","display_name":"Content and structure summarisation for accessing XML documents","publication_year":2009,"publication_date":"2009-06-25","ids":{"openalex":"https://openalex.org/W2027019938","doi":"https://doi.org/10.1145/1670598.1670617","mag":"2027019938"},"language":"en","primary_location":{"id":"doi:10.1145/1670598.1670617","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1670598.1670617","pdf_url":null,"source":{"id":"https://openalex.org/S6756005","display_name":"ACM SIGIR Forum","issn_l":"0163-5840","issn":["0163-5840","1558-0229"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGIR Forum","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010729017","display_name":"Zolt\u00e1n Szl\u00e1vik","orcid":"https://orcid.org/0000-0002-2781-3795"},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zolt\u00e1n Szl\u00e1vik","raw_affiliation_strings":["Queen Mary University of London, UK"],"affiliations":[{"raw_affiliation_string":"Queen Mary University of London, UK","institution_ids":["https://openalex.org/I166337079"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5010729017"],"corresponding_institution_ids":["https://openalex.org/I166337079"],"apc_list":null,"apc_paid":null,"fwci":0.901,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.80148966,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"43","issue":"1","first_page":"74","last_page":"74"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8864487409591675},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.8276610374450684},{"id":"https://openalex.org/keywords/document-structure-description","display_name":"Document Structure Description","score":0.8113530874252319},{"id":"https://openalex.org/keywords/well-formed-document","display_name":"Well-formed document","score":0.6154743432998657},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.5724737644195557},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.568572998046875},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5354360342025757},{"id":"https://openalex.org/keywords/document-type-definition","display_name":"Document type definition","score":0.5353617668151855},{"id":"https://openalex.org/keywords/xml-validation","display_name":"XML validation","score":0.4366023540496826},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.34872183203697205}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8864487409591675},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.8276610374450684},{"id":"https://openalex.org/C68699486","wikidata":"https://www.wikidata.org/wiki/Q265904","display_name":"Document Structure Description","level":3,"score":0.8113530874252319},{"id":"https://openalex.org/C137441365","wikidata":"https://www.wikidata.org/wiki/Q7981054","display_name":"Well-formed document","level":5,"score":0.6154743432998657},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.5724737644195557},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.568572998046875},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5354360342025757},{"id":"https://openalex.org/C84314905","wikidata":"https://www.wikidata.org/wiki/Q212327","display_name":"Document type definition","level":4,"score":0.5353617668151855},{"id":"https://openalex.org/C55348073","wikidata":"https://www.wikidata.org/wiki/Q595926","display_name":"XML validation","level":3,"score":0.4366023540496826},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.34872183203697205},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1670598.1670617","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1670598.1670617","pdf_url":null,"source":{"id":"https://openalex.org/S6756005","display_name":"ACM SIGIR Forum","issn_l":"0163-5840","issn":["0163-5840","1558-0229"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGIR Forum","raw_type":"journal-article"},{"id":"pmh:hdl:10068/964204","is_oa":false,"landing_page_url":"http://hdl.handle.net/10068/964204","pdf_url":null,"source":{"id":"https://openalex.org/S4377196900","display_name":"OpenGrey (Institut de l'Information Scientifique et Technique)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1295345811","host_organization_name":"Institut de l'Information Scientifique et Technique","host_organization_lineage":["https://openalex.org/I1295345811"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"U - Thesis"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W200139865","https://openalex.org/W208548429","https://openalex.org/W1565039238","https://openalex.org/W1573514622","https://openalex.org/W1660390307","https://openalex.org/W1974035951","https://openalex.org/W1978255832","https://openalex.org/W2008427173","https://openalex.org/W2026642282","https://openalex.org/W2048987619","https://openalex.org/W2073562093","https://openalex.org/W2073722401","https://openalex.org/W2074011351","https://openalex.org/W2079896767","https://openalex.org/W2097221264","https://openalex.org/W2128089840","https://openalex.org/W2145827569","https://openalex.org/W2158291389","https://openalex.org/W2167260896","https://openalex.org/W2951028592","https://openalex.org/W3020974817"],"related_works":["https://openalex.org/W1562732971","https://openalex.org/W2495697035","https://openalex.org/W2293417074","https://openalex.org/W283628559","https://openalex.org/W2027019938","https://openalex.org/W1581124865","https://openalex.org/W2079058854","https://openalex.org/W2171917809","https://openalex.org/W2054593300","https://openalex.org/W1801801680"],"abstract_inverted_index":{"As":[0,147],"the":[1,41,52,60,71,99,103,117,183,189,198,264],"availability":[2],"of":[3,27,30,44,54,56,70,73,94,101,105,110,116,120,149,168,176,185,194,209,222,224,266],"structured":[4],"documents":[5,138,150],"is":[6,48,134,162,215,229,235,274],"constantly":[7],"increasing,":[8],"retrieval":[9,57,96],"systems":[10,58,97],"able":[11],"to":[12,50,67,78,91,154,165,180,263],"return":[13],"document":[14,31,45,63,80,106,121,140,145,159,169],"portions":[15,81,170],"are":[16,112,126,178,203,241],"being":[17],"developed.":[18],"Structured":[19],"documents,":[20,74],"usually":[21],"formatted":[22],"in":[23,75,82,98,128,157,171,182,212,256],"XML,":[24],"may":[25],"consist":[26],"large":[28],"numbers":[29],"portions,":[32,46,64,122],"often":[33],"organised":[34],"into":[35],"a":[36,89,129],"hierarchical":[37],"logical":[38],"structure.":[39],"With":[40],"high":[42],"number":[43],"it":[47,161],"necessary":[49],"direct":[51],"attention":[53],"users":[55],"towards":[59],"most":[61],"important":[62],"and":[65,231,268],"also,":[66],"give":[68],"overviews":[69],"structure":[72,217,227,245,251],"other":[76,186],"words,":[77],"show":[79],"context.":[83],"This":[84],"thesis":[85,214,258,273],"investigates":[86],"summarisation":[87,111,133,210,267],"as":[88,226],"means":[90],"help":[92],"searchers":[93,181],"XML":[95,124,172,270],"process":[100],"accessing":[102],"contents":[104,119],"portions.":[107,146],"Two":[108],"types":[109],"investigated.":[113],"First,":[114],"summaries":[115,148,167,193],"textual":[118,192],"called":[123,216],"elements,":[125],"studied":[127,236],"user-based":[130],"environment.":[131],"Traditionally,":[132],"associated":[135],"with":[136,144],"whole":[137,158],"or":[139,247],"sets,":[141],"but":[142],"rarely":[143],"have":[151],"been":[152],"proved":[153],"be":[155],"useful":[156],"retrieval,":[160],"considered":[163],"worthwhile":[164],"investigate":[166],"element":[173],"retrieval.":[174,271],"Summaries":[175],"elements":[177,187,195],"presented":[179,255],"context":[184],"from":[188],"document.":[190],"The":[191,206,219,253,272],"also":[196],"reflect":[197],"searchers'":[199,239],"information":[200],"needs:":[201],"they":[202],"query":[204],"based.":[205],"second":[207],"type":[208],"investigated":[211],"this":[213,257],"summarisation.":[218],"automatic":[220],"generation":[221,234],"tables":[223],"contents,":[225],"summaries,":[228],"described":[230],"examined.":[232],"ToC":[233],"either":[237],"when":[238],"queries":[240],"available":[242,275],"(query":[243,249],"based":[244],"summarisation)":[246],"otherwise":[248],"independent":[250],"summarisation).":[252],"work":[254],"has":[259],"made":[260],"several":[261],"contributions":[262],"fields":[265],"interactive":[269],"online":[276],"at":[277],"http://www.dcs.qmul.ac.uk/~zolley/thesis.html.":[278]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
