{"id":"https://openalex.org/W2141384558","doi":"https://doi.org/10.1017/s0956796802004410","title":"Regular expression pattern matching for XML","display_name":"Regular expression pattern matching for XML","publication_year":2003,"publication_date":"2003-10-29","ids":{"openalex":"https://openalex.org/W2141384558","doi":"https://doi.org/10.1017/s0956796802004410","mag":"2141384558"},"language":"en","primary_location":{"id":"doi:10.1017/s0956796802004410","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s0956796802004410","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/C845B41E6B150FBD7731EE396FBCB911/S0956796802004410a.pdf/div-class-title-regular-expression-pattern-matching-for-xml-div.pdf","source":{"id":"https://openalex.org/S12266929","display_name":"Journal of Functional Programming","issn_l":"0956-7968","issn":["0956-7968","1469-7653"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Functional Programming","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/C845B41E6B150FBD7731EE396FBCB911/S0956796802004410a.pdf/div-class-title-regular-expression-pattern-matching-for-xml-div.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025142030","display_name":"Haruo Hosoya","orcid":"https://orcid.org/0000-0002-5660-0801"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]},{"id":"https://openalex.org/I27429435","display_name":"Kyoto Institute of Technology","ror":"https://ror.org/00965ax52","country_code":"JP","type":"education","lineage":["https://openalex.org/I27429435"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"HARUO HOSOYA","raw_affiliation_strings":["Research Institute for Mathematical Sciences, Kyoto University, Sakyo-ku, Kyoto 606-8502, Japan (e-mail:","Research Institute for Mathematical Sciences, Kyoto University, Sakyo-ku, Kyoto 606-8502, Japan (e-mail: hahosoya@kurims.kyoto-u.ac.jp)"],"affiliations":[{"raw_affiliation_string":"Research Institute for Mathematical Sciences, Kyoto University, Sakyo-ku, Kyoto 606-8502, Japan (e-mail:","institution_ids":["https://openalex.org/I22299242","https://openalex.org/I27429435"]},{"raw_affiliation_string":"Research Institute for Mathematical Sciences, Kyoto University, Sakyo-ku, Kyoto 606-8502, Japan (e-mail: hahosoya@kurims.kyoto-u.ac.jp)","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085361253","display_name":"Benjamin C. Pierce","orcid":"https://orcid.org/0000-0001-7839-1636"},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]},{"id":"https://openalex.org/I110357561","display_name":"University of the Sciences","ror":"https://ror.org/048gmay44","country_code":"US","type":"education","lineage":["https://openalex.org/I110357561"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"BENJAMIN C. PIERCE","raw_affiliation_strings":["Department of Computer and Information Science, University of Pennsylvania, 200 S. 33rd Street, Philadelphia, PA 19104-6389, USA (e-mail:","Department of Computer and Information Science, University of Pennsylvania, 200 S. 33rd Street, Philadelphia, PA 19104-6389, USA (e-mail: bcpierce@cis.upenn.edu)#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer and Information Science, University of Pennsylvania, 200 S. 33rd Street, Philadelphia, PA 19104-6389, USA (e-mail:","institution_ids":["https://openalex.org/I79576946","https://openalex.org/I110357561"]},{"raw_affiliation_string":"Department of Computer and Information Science, University of Pennsylvania, 200 S. 33rd Street, Philadelphia, PA 19104-6389, USA (e-mail: bcpierce@cis.upenn.edu)#TAB#","institution_ids":["https://openalex.org/I79576946"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5025142030"],"corresponding_institution_ids":["https://openalex.org/I22299242","https://openalex.org/I27429435"],"apc_list":null,"apc_paid":null,"fwci":15.99,"has_fulltext":true,"cited_by_count":76,"citation_normalized_percentile":{"value":0.99104131,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"13","issue":"6","first_page":"961","last_page":"1004"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regular-expression","display_name":"Regular expression","score":0.9012283086776733},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8287686109542847},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.6411729454994202},{"id":"https://openalex.org/keywords/type-inference","display_name":"Type inference","score":0.5991965532302856},{"id":"https://openalex.org/keywords/automaton","display_name":"Automaton","score":0.5804711580276489},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.553446352481842},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.5345026254653931},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5044595003128052},{"id":"https://openalex.org/keywords/alternation","display_name":"Alternation (linguistics)","score":0.4990384578704834},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.4961751401424408},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.464703232049942},{"id":"https://openalex.org/keywords/functional-programming","display_name":"Functional programming","score":0.46192994713783264},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.4106016457080841},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.39904412627220154},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.3855779767036438},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2870849668979645},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13987678289413452}],"concepts":[{"id":"https://openalex.org/C121329065","wikidata":"https://www.wikidata.org/wiki/Q185612","display_name":"Regular expression","level":2,"score":0.9012283086776733},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8287686109542847},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.6411729454994202},{"id":"https://openalex.org/C198370458","wikidata":"https://www.wikidata.org/wiki/Q586459","display_name":"Type inference","level":3,"score":0.5991965532302856},{"id":"https://openalex.org/C112505250","wikidata":"https://www.wikidata.org/wiki/Q787116","display_name":"Automaton","level":2,"score":0.5804711580276489},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.553446352481842},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.5345026254653931},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5044595003128052},{"id":"https://openalex.org/C26826806","wikidata":"https://www.wikidata.org/wiki/Q438358","display_name":"Alternation (linguistics)","level":2,"score":0.4990384578704834},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.4961751401424408},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.464703232049942},{"id":"https://openalex.org/C42383842","wikidata":"https://www.wikidata.org/wiki/Q193076","display_name":"Functional programming","level":2,"score":0.46192994713783264},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.4106016457080841},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.39904412627220154},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3855779767036438},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2870849668979645},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13987678289413452},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s0956796802004410","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s0956796802004410","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/C845B41E6B150FBD7731EE396FBCB911/S0956796802004410a.pdf/div-class-title-regular-expression-pattern-matching-for-xml-div.pdf","source":{"id":"https://openalex.org/S12266929","display_name":"Journal of Functional Programming","issn_l":"0956-7968","issn":["0956-7968","1469-7653"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Functional Programming","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1017/s0956796802004410","is_oa":true,"landing_page_url":"https://doi.org/10.1017/s0956796802004410","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/C845B41E6B150FBD7731EE396FBCB911/S0956796802004410a.pdf/div-class-title-regular-expression-pattern-matching-for-xml-div.pdf","source":{"id":"https://openalex.org/S12266929","display_name":"Journal of Functional Programming","issn_l":"0956-7968","issn":["0956-7968","1469-7653"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Functional Programming","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309370","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2141384558.pdf","grobid_xml":"https://content.openalex.org/works/W2141384558.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W33041674","https://openalex.org/W270849871","https://openalex.org/W1540080689","https://openalex.org/W1558109178","https://openalex.org/W1569254407","https://openalex.org/W1578467883","https://openalex.org/W1583633027","https://openalex.org/W1593569536","https://openalex.org/W1699388987","https://openalex.org/W1829244603","https://openalex.org/W1926956344","https://openalex.org/W1965014786","https://openalex.org/W1977793919","https://openalex.org/W1990483472","https://openalex.org/W1995362929","https://openalex.org/W2019789808","https://openalex.org/W2029764918","https://openalex.org/W2029791960","https://openalex.org/W2043687297","https://openalex.org/W2060876856","https://openalex.org/W2072137506","https://openalex.org/W2086130705","https://openalex.org/W2087060113","https://openalex.org/W2094945667","https://openalex.org/W2115587183","https://openalex.org/W2125252697","https://openalex.org/W2133654517","https://openalex.org/W2137946574","https://openalex.org/W2147125687","https://openalex.org/W2150750971","https://openalex.org/W2167998587","https://openalex.org/W4253003117","https://openalex.org/W4285719527","https://openalex.org/W4302339081","https://openalex.org/W6677073233"],"related_works":["https://openalex.org/W2031906380","https://openalex.org/W2056253254","https://openalex.org/W3140480875","https://openalex.org/W1975501418","https://openalex.org/W2131334283","https://openalex.org/W2166786469","https://openalex.org/W2141384558","https://openalex.org/W23186322","https://openalex.org/W3171422199","https://openalex.org/W2087271899"],"abstract_inverted_index":{"We":[0,16,59,177],"propose":[1],"regular":[2,25,89,126],"expression":[3,26,75,90],"pattern":[4,48,109],"matching":[5],"as":[6,29],"a":[7,46,56,100,183],"core":[8],"feature":[9],"of":[10,43,55,67,114,134,154,174],"programming":[11],"languages":[12,83],"for":[13,71],"manipulating":[14],"XML.":[15],"extend":[17],"conventional":[18],"pattern-matching":[19],"facilities":[20],"(as":[21],"in":[22,82,132],"ML)":[23],"with":[24,84,151,159],"operators":[27],"such":[28],"repetition":[30,155],"(*)":[31],",":[32,35],"alternation":[33,157],"(|)":[34],"etc.,":[36],"that":[37,104],"can":[38],"match":[39],"arbitrarily":[40],"long":[41],"sequences":[42],"subtrees,":[44],"allowing":[45],"compact":[47],"to":[49,63,79,108,166],"extract":[50],"data":[51,184],"from":[52,111],"the":[53,112,152,160,170,175],"middle":[54],"complex":[57],"sequence.":[58],"then":[60,130],"show":[61],"how":[62],"check":[64],"standard":[65,135],"notions":[66],"exhaustiveness":[68],"and":[69,123,129,140,156,172],"redundancy":[70],"these":[72,179,187],"patterns.":[73],"Regular":[74],"patterns":[76,124,158],"are":[77],"intended":[78],"be":[80],"used":[81],"type":[85,96,101,106,113,118],"systems":[86],"based":[87],"on":[88,142],"types":[91,122],".":[92],"To":[93],"avoid":[94],"excessive":[95],"annotations,":[97],"we":[98],"develop":[99],"inference":[102,119],"scheme":[103],"propagates":[105],"constraints":[107],"variables":[110],"input":[115],"values.":[116],"The":[117,145],"algorithm":[120],"translates":[121],"into":[125],"tree":[127,143],"automata,":[128],"works":[131],"terms":[133],"closure":[136,188],"operations":[137,189],"(union,":[138],"intersection,":[139],"difference)":[141],"automata.":[144],"main":[146],"technical":[147],"challenge":[148],"is":[149],"dealing":[150],"interaction":[153],"first-match":[161],"policy,":[162],"which":[163],"gives":[164],"rise":[165],"subtleties":[167],"concerning":[168],"both":[169],"termination":[171],"precision":[173],"analysis.":[176],"address":[178],"issues":[180],"by":[181],"introducing":[182],"structure":[185],"representing":[186],"lazily.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
