{"id":"https://openalex.org/W4404130041","doi":"https://doi.org/10.1145/3695840","title":"Revisiting Weighted Information Extraction: A Simpler and Faster Algorithm for Ranked Enumeration","display_name":"Revisiting Weighted Information Extraction: A Simpler and Faster Algorithm for Ranked Enumeration","publication_year":2024,"publication_date":"2024-11-04","ids":{"openalex":"https://openalex.org/W4404130041","doi":"https://doi.org/10.1145/3695840"},"language":"en","primary_location":{"id":"doi:10.1145/3695840","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3695840","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3695840","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3695840","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022706035","display_name":"Pawe\u0142 Gawrychowski","orcid":"https://orcid.org/0000-0002-6993-5440"},"institutions":[{"id":"https://openalex.org/I219388962","display_name":"University of Wroc\u0142aw","ror":"https://ror.org/00yae6e25","country_code":"PL","type":"education","lineage":["https://openalex.org/I219388962"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Pawe\u0142 Gawrychowski","raw_affiliation_strings":["University of Wroc\u0142aw, Wroc\u0142aw, Poland"],"affiliations":[{"raw_affiliation_string":"University of Wroc\u0142aw, Wroc\u0142aw, Poland","institution_ids":["https://openalex.org/I219388962"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006548981","display_name":"Flor\u00edn Manea","orcid":"https://orcid.org/0000-0001-6094-3324"},"institutions":[{"id":"https://openalex.org/I74656192","display_name":"University of G\u00f6ttingen","ror":"https://ror.org/01y9bpm73","country_code":"DE","type":"education","lineage":["https://openalex.org/I74656192"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Florin Manea","raw_affiliation_strings":["Computer Science Department and CIDAS, Universit\u00e4t G\u00f6ttingen, G\u00f6ttingen, Germany"],"affiliations":[{"raw_affiliation_string":"Computer Science Department and CIDAS, Universit\u00e4t G\u00f6ttingen, G\u00f6ttingen, Germany","institution_ids":["https://openalex.org/I74656192"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038601790","display_name":"Markus L. Schmid","orcid":"https://orcid.org/0000-0001-5137-1504"},"institutions":[{"id":"https://openalex.org/I39343248","display_name":"Humboldt-Universit\u00e4t zu Berlin","ror":"https://ror.org/01hcx6992","country_code":"DE","type":"education","lineage":["https://openalex.org/I39343248"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Markus L. Schmid","raw_affiliation_strings":["Humboldt-Universit\u00e4t zu Berlin, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Humboldt-Universit\u00e4t zu Berlin, Berlin, Germany","institution_ids":["https://openalex.org/I39343248"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5022706035"],"corresponding_institution_ids":["https://openalex.org/I219388962"],"apc_list":null,"apc_paid":null,"fwci":0.375,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.59262234,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"2","issue":"5","first_page":"1","last_page":"19"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/enumeration","display_name":"Enumeration","score":0.961430549621582},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5419514775276184},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.499680757522583},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4560425877571106},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.42805033922195435},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.20179447531700134},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.08403593301773071}],"concepts":[{"id":"https://openalex.org/C156340839","wikidata":"https://www.wikidata.org/wiki/Q2704791","display_name":"Enumeration","level":2,"score":0.961430549621582},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5419514775276184},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.499680757522583},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4560425877571106},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.42805033922195435},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.20179447531700134},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.08403593301773071},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3695840","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3695840","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3695840","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},{"id":"pmh:oai:publications.goettingen-research-online.de:2/153228","is_oa":true,"landing_page_url":"https://resolver.sub.uni-goettingen.de/purl?gro-2/153228","pdf_url":null,"source":{"id":"https://openalex.org/S4306401634","display_name":"GoeScholar  The Publication Server of the Georg-August-Universit\u00e4t G\u00f6ttingen (Georg-August-Universit\u00e4t G\u00f6ttingen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210122495","host_organization_name":"Asklepios Klinik St. Georg","host_organization_lineage":["https://openalex.org/I4210122495"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"yes"}],"best_oa_location":{"id":"doi:10.1145/3695840","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3695840","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3695840","source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G176652226","display_name":null,"funder_award_id":"466789228, 522576760","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G6298832496","display_name":null,"funder_award_id":"2023/51/B/ST6/01505","funder_id":"https://openalex.org/F4320322511","funder_display_name":"Narodowe Centrum Nauki"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320322511","display_name":"Narodowe Centrum Nauki","ror":"https://ror.org/03ha2q922"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4404130041.pdf"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W1602103078","https://openalex.org/W1984816083","https://openalex.org/W2098755772","https://openalex.org/W2111340560","https://openalex.org/W2131058166","https://openalex.org/W2141456009","https://openalex.org/W2149710566","https://openalex.org/W2577865170","https://openalex.org/W2883227679","https://openalex.org/W2899702797","https://openalex.org/W2938252862","https://openalex.org/W2963265283","https://openalex.org/W3007878418","https://openalex.org/W3013294921","https://openalex.org/W3013397275","https://openalex.org/W3137215238","https://openalex.org/W3154082294","https://openalex.org/W3155438827","https://openalex.org/W4280619330","https://openalex.org/W4282827770","https://openalex.org/W4387323863","https://openalex.org/W6910307883"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4391375266","https://openalex.org/W108845024","https://openalex.org/W2406961474","https://openalex.org/W4300125793","https://openalex.org/W2578985712","https://openalex.org/W2952598754","https://openalex.org/W3042106073","https://openalex.org/W2143566611"],"abstract_inverted_index":{"Information":[0],"extraction":[1],"from":[2,247],"textual":[3],"data,":[4],"where":[5,31,117],"the":[6,15,28,39,60,63,68,76,89,97,120,126,131,150,158,161,169,199,212],"query":[7],"is":[8,17,93,119,125],"represented":[9],"by":[10,47],"a":[11,36,178,186,218],"finite":[12],"transducer":[13],"and":[14,24,38,52,110,123,137,185,234,251],"task":[16],"to":[18,27,43,167,176,226],"enumerate":[19],"all":[20],"results":[21,171],"without":[22],"repetition,":[23],"its":[25],"extension":[26],"weighted":[29,132],"case,":[30,133],"each":[32],"output":[33,40,128,202],"element":[34,203],"has":[35],"weight":[37],"elements":[41],"are":[42,50],"be":[44,86,103],"enumerated":[45],"sorted":[46],"their":[48],"weights,":[49],"important":[51],"well":[53],"studied":[54],"problems":[55],"in":[56,88,96,114],"database":[57],"theory.":[58],"On":[59],"one":[61],"hand,":[62],"first":[64,164],"framework":[65],"already":[66],"covers":[67,79],"well-known":[69],"case":[70,99],"of":[71,152,160,188],"regular":[72],"document":[73],"spanners,":[74],"while":[75],"latter":[77],"setting":[78],"several":[80],"practically":[81],"relevant":[82],"tasks":[83],"that":[84,95,223],"cannot":[85],"described":[87],"unweighted":[90,98],"setting.":[91],"It":[92],"known":[94],"this":[100,242],"problem":[101],"can":[102],"solved":[104],"with":[105,145,182,230,238],"linear":[106,146,183,231,252],"time":[107,147,232],"preprocessing":[108,184,233],"O(|D|)":[109],"output-linear":[111,235],"delay":[112,151,187,236],"O(|s|)":[113,237],"data":[115,122,207],"complexity,":[116],"D":[118],"input":[121],"s":[124,204],"current":[127],"element.":[129],"For":[130],"Bourhis,":[134],"Grez,":[135],"Jachiet,":[136],"Riveros":[138],"[ICDT":[139],"2021]":[140],"recently":[141],"designed":[142],"an":[143,228],"algorithm":[144,181,229],"preprocessing,":[148],"but":[149],"O(|s|":[153],"\u00b7":[154],"log|D|)":[155],"depends":[156],"on":[157,172],"size":[159],"data.":[162],"We":[163],"show":[165],"how":[166],"leverage":[168],"existing":[170],"enumerating":[173],"shortest":[174],"paths":[175],"obtain":[177],"simple":[179],"alternative":[180],"O(|s":[189],"i":[190,200,205],"|":[191],"+":[192],"min\\":[193],"log":[194],"i,":[195],"log|D|":[196],")":[197],"for":[198],"th":[201],"(in":[206],"complexity);":[208],"thus,":[209],"substantially":[210],"improving":[211],"previous":[213],"algorithm.":[214],"Next,":[215],"we":[216,244],"develop":[217],"technically":[219],"involved":[220],"rounding":[221],"technique":[222],"allows":[224],"us":[225],"devise":[227],"high":[239],"probability.":[240],"To":[241],"end,":[243],"combine":[245],"tools":[246],"algebra,":[248],"high-dimensional":[249],"geometry,":[250],"programming.":[253]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
