{"id":"https://openalex.org/W2141456009","doi":"https://doi.org/10.1145/2699442","title":"Document Spanners","display_name":"Document Spanners","publication_year":2015,"publication_date":"2015-05-06","ids":{"openalex":"https://openalex.org/W2141456009","doi":"https://doi.org/10.1145/2699442","mag":"2141456009"},"language":"en","primary_location":{"id":"doi:10.1145/2699442","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2699442","pdf_url":null,"source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027117465","display_name":"Ronald Fagin","orcid":"https://orcid.org/0000-0002-7374-0347"},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ronald Fagin","raw_affiliation_strings":["IBM Research -- Almaden, San Jose, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research -- Almaden, San Jose, CA","institution_ids":["https://openalex.org/I4210085935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006706357","display_name":"Benny Kimelfeld","orcid":"https://orcid.org/0000-0002-7156-1572"},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Benny Kimelfeld","raw_affiliation_strings":["IBM Research -- Almaden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research -- Almaden","institution_ids":["https://openalex.org/I4210085935"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074416632","display_name":"Frederick Reiss","orcid":"https://orcid.org/0009-0002-1254-1798"},"institutions":[{"id":"https://openalex.org/I4210085935","display_name":"IBM Research - Almaden","ror":"https://ror.org/005w8dd04","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210085935","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Frederick Reiss","raw_affiliation_strings":["IBM Research -- Almaden, San Jose, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research -- Almaden, San Jose, CA","institution_ids":["https://openalex.org/I4210085935"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022558461","display_name":"Stijn Vansummeren","orcid":"https://orcid.org/0000-0001-7793-9049"},"institutions":[{"id":"https://openalex.org/I132053463","display_name":"Universit\u00e9 Libre de Bruxelles","ror":"https://ror.org/01r9htc13","country_code":"BE","type":"education","lineage":["https://openalex.org/I132053463"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Stijn Vansummeren","raw_affiliation_strings":["Universit\u00e9 Libre de Bruxelles (ULB), Brussels, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit\u00e9 Libre de Bruxelles (ULB), Brussels, Belgium","institution_ids":["https://openalex.org/I132053463"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5027117465"],"corresponding_institution_ids":["https://openalex.org/I4210085935"],"apc_list":null,"apc_paid":null,"fwci":9.3491,"has_fulltext":false,"cited_by_count":92,"citation_normalized_percentile":{"value":0.97845123,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"62","issue":"2","first_page":"1","last_page":"51"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11567","display_name":"semigroups and automata theory","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spanner","display_name":"Spanner","score":0.779596745967865},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.6049134731292725},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.5717154741287231},{"id":"https://openalex.org/keywords/regular-expression","display_name":"Regular expression","score":0.5631874799728394},{"id":"https://openalex.org/keywords/extension","display_name":"Extension (predicate logic)","score":0.5184202194213867},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4635573625564575},{"id":"https://openalex.org/keywords/algebraic-operation","display_name":"Algebraic operation","score":0.43670839071273804},{"id":"https://openalex.org/keywords/closure","display_name":"Closure (psychology)","score":0.43659812211990356},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4333493113517761},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.42680680751800537},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4187510013580322},{"id":"https://openalex.org/keywords/algebra-over-a-field","display_name":"Algebra over a field","score":0.3442921042442322},{"id":"https://openalex.org/keywords/algebraic-number","display_name":"Algebraic number","score":0.30047813057899475},{"id":"https://openalex.org/keywords/pure-mathematics","display_name":"Pure mathematics","score":0.12202656269073486},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09555330872535706},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09094473719596863}],"concepts":[{"id":"https://openalex.org/C2779585601","wikidata":"https://www.wikidata.org/wiki/Q4049850","display_name":"Spanner","level":2,"score":0.779596745967865},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.6049134731292725},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.5717154741287231},{"id":"https://openalex.org/C121329065","wikidata":"https://www.wikidata.org/wiki/Q185612","display_name":"Regular expression","level":2,"score":0.5631874799728394},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.5184202194213867},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4635573625564575},{"id":"https://openalex.org/C136003732","wikidata":"https://www.wikidata.org/wiki/Q3854337","display_name":"Algebraic operation","level":3,"score":0.43670839071273804},{"id":"https://openalex.org/C146834321","wikidata":"https://www.wikidata.org/wiki/Q2979672","display_name":"Closure (psychology)","level":2,"score":0.43659812211990356},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4333493113517761},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.42680680751800537},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4187510013580322},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.3442921042442322},{"id":"https://openalex.org/C9376300","wikidata":"https://www.wikidata.org/wiki/Q168817","display_name":"Algebraic number","level":2,"score":0.30047813057899475},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.12202656269073486},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09555330872535706},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09094473719596863},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C188082640","wikidata":"https://www.wikidata.org/wiki/Q1780899","display_name":"Complementation","level":4,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C127716648","wikidata":"https://www.wikidata.org/wiki/Q104053","display_name":"Phenotype","level":3,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/2699442","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2699442","pdf_url":null,"source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},{"id":"pmh:oai:dipot.ulb.ac.be:2013/200174","is_oa":false,"landing_page_url":"http://hdl.handle.net/2013/ULB-DIPOT:oai:dipot.ulb.ac.be:2013/200174","pdf_url":null,"source":{"id":"https://openalex.org/S4306401063","display_name":"D\u00e9p\u00f4t institutionnel de l'Universit\u00e9 libre de Bruxelles (Universit\u00e9 Libre de Bruxelles)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I132053463","host_organization_name":"Universit\u00e9 Libre de Bruxelles","host_organization_lineage":["https://openalex.org/I132053463"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of the Association for Computing Machinery, 62 (2","raw_type":"info:ulb-repo/semantics/openurl/article"},{"id":"pmh:oai:documentserver.uhasselt.be:1942/33431","is_oa":false,"landing_page_url":"http://hdl.handle.net/1942/33431","pdf_url":null,"source":{"id":"https://openalex.org/S4306401926","display_name":"Document Server@UHasselt (UHasselt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I878454856","host_organization_name":"Hasselt University","host_organization_lineage":["https://openalex.org/I878454856"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W165164194","https://openalex.org/W1502749598","https://openalex.org/W1505482284","https://openalex.org/W1514152137","https://openalex.org/W1546515396","https://openalex.org/W1564013439","https://openalex.org/W1580943896","https://openalex.org/W1601674470","https://openalex.org/W1607983314","https://openalex.org/W1934019294","https://openalex.org/W1964071625","https://openalex.org/W1965306495","https://openalex.org/W1967693793","https://openalex.org/W1969595233","https://openalex.org/W1970599921","https://openalex.org/W1979960035","https://openalex.org/W1980622548","https://openalex.org/W1986891954","https://openalex.org/W1991958955","https://openalex.org/W1997520998","https://openalex.org/W1999563429","https://openalex.org/W2007245320","https://openalex.org/W2020437202","https://openalex.org/W2032874529","https://openalex.org/W2035266017","https://openalex.org/W2044652416","https://openalex.org/W2054693743","https://openalex.org/W2056865152","https://openalex.org/W2058241717","https://openalex.org/W2059501879","https://openalex.org/W2068882115","https://openalex.org/W2077518845","https://openalex.org/W2083735143","https://openalex.org/W2083909946","https://openalex.org/W2090567381","https://openalex.org/W2098720114","https://openalex.org/W2101571534","https://openalex.org/W2105590118","https://openalex.org/W2110367654","https://openalex.org/W2116548113","https://openalex.org/W2117657788","https://openalex.org/W2119422073","https://openalex.org/W2147880316","https://openalex.org/W2159133812","https://openalex.org/W2160133521","https://openalex.org/W2161484642","https://openalex.org/W2164949130","https://openalex.org/W2201604718","https://openalex.org/W2334129451","https://openalex.org/W2748837517","https://openalex.org/W2913383557","https://openalex.org/W3142621357","https://openalex.org/W4285719527","https://openalex.org/W6681868148"],"related_works":["https://openalex.org/W2949889395","https://openalex.org/W2162831161","https://openalex.org/W4297623464","https://openalex.org/W1549877447","https://openalex.org/W3125261964","https://openalex.org/W2181888227","https://openalex.org/W2032133070","https://openalex.org/W2502219810","https://openalex.org/W3190489747","https://openalex.org/W2141456009"],"abstract_inverted_index":{"An":[0],"intrinsic":[1],"part":[2],"of":[3,11,57,62,69,76,124,134,140,143,174,179,210],"information":[4],"extraction":[5],"is":[6,28,65,107,122],"the":[7,25,50,58,67,89,101,119,153,157,167,172,175,180,191,208,242],"creation":[8],"and":[9,212],"manipulation":[10],"relations":[12,86],"extracted":[13],"from":[14,88],"text.":[15],"In":[16],"this":[17,63],"article,":[18],"we":[19,30,218,235],"develop":[20],"a":[21,32,47,82],"foundational":[22],"framework":[23,106],"where":[24,118],"central":[26],"construct":[27],"what":[29],"call":[31],"document":[33],"spanner":[34,37,41,136],"(or":[35],"just":[36],"for":[38,115],"short).":[39],"A":[40],"maps":[42],"an":[43,95,111,216],"input":[44,90],"string":[45],"into":[46],"relation":[48],"over":[49],"spans":[51,147],"(intervals":[52],"specified":[53],"by":[54,109,138,194],"bounding":[55],"indices)":[56],"string.":[59],"The":[60,187],"focus":[61],"article":[64],"on":[66,207],"representation":[68,84,121],"spanners.":[70,104,214],"Conceptually,":[71],"there":[72],"are":[73,223,232],"two":[74,141],"kinds":[75,142],"such":[77],"representations.":[78],"Spanners":[79],"defined":[80,93],"in":[81,94,200,241],"primitive":[83,120,135],"extract":[85],"directly":[87],"string;":[91],"those":[92],"algebra":[96,173],"apply":[97],"algebraic":[98],"operations":[99],"to":[100,148],"primitively":[102],"represented":[103],"This":[105],"driven":[108],"SystemT,":[110],"IBM":[112],"commercial":[113],"product":[114],"text":[116],"analysis,":[117],"that":[123,145,152,220],"regular":[125,162,176,192,211,221],"expressions":[126,163],"with":[127,164,238],"capture":[128,165],"variables.":[129,149],"We":[130,150,202],"define":[131],"additional":[132],"types":[133],"representations":[137],"means":[139],"automata":[144],"assign":[146],"prove":[151,219],"first":[154,181],"kind":[155,169,182],"has":[156],"same":[158],"expressive":[159],"power":[160],"as":[161],"variables;":[166],"second":[168],"expresses":[170],"precisely":[171],"spanners\u2014the":[177],"closure":[178],"under":[183,225],"standard":[184],"relational":[185],"operators.":[186],"core":[188,213,230],"spanners":[189,222,231],"extend":[190],"ones":[193],"string-equality":[195],"selection":[196],"(an":[197],"extension":[198],"used":[199],"SystemT).":[201],"give":[203],"some":[204],"fundamental":[205],"results":[206],"expressiveness":[209],"As":[215],"example,":[217],"closed":[224],"difference":[226],"(and":[227],"complement),":[228],"but":[229],"not.":[233],"Finally,":[234],"establish":[236],"connections":[237],"related":[239],"notions":[240],"literature.":[243]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":16},{"year":2019,"cited_by_count":12},{"year":2018,"cited_by_count":10},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":1}],"updated_date":"2026-05-29T09:21:14.243279","created_date":"2016-06-24T00:00:00"}
