{"id":"https://openalex.org/W2061743259","doi":"https://doi.org/10.1017/s1351324905004092","title":"Efficient dictionary-based text rewriting using subsequential transducers","display_name":"Efficient dictionary-based text rewriting using subsequential transducers","publication_year":2006,"publication_date":"2006-02-15","ids":{"openalex":"https://openalex.org/W2061743259","doi":"https://doi.org/10.1017/s1351324905004092","mag":"2061743259"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324905004092","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324905004092","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114255303","display_name":"Stoyan Mihov","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134980","display_name":"Institute for Parallel Processing","ror":"https://ror.org/047hhy227","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210134980"]}],"countries":["BG"],"is_corresponding":true,"raw_author_name":"S. MIHOV","raw_affiliation_strings":["Institute for Parallel Processing, Bulgarian Academy of Sciences, Bulgaria e-mail:","Institute for parallel processing, bulgarian academy of sciences, bulgaria e-mail: stoyan@lml.bas.bg#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Parallel Processing, Bulgarian Academy of Sciences, Bulgaria e-mail:","institution_ids":["https://openalex.org/I4210134980"]},{"raw_affiliation_string":"Institute for parallel processing, bulgarian academy of sciences, bulgaria e-mail: stoyan@lml.bas.bg#TAB#","institution_ids":["https://openalex.org/I4210134980"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109699155","display_name":"Klaus U. Schulz","orcid":null},"institutions":[{"id":"https://openalex.org/I174004417","display_name":"Munich University of Applied Sciences","ror":"https://ror.org/012k1v959","country_code":"DE","type":"education","lineage":["https://openalex.org/I174004417"]},{"id":"https://openalex.org/I8204097","display_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","ror":"https://ror.org/05591te55","country_code":"DE","type":"education","lineage":["https://openalex.org/I8204097"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"K. U. SCHULZ","raw_affiliation_strings":["CIS, University of Munich, Munich, Germany e-mail:","Cis, university of munich, munich, germany e-mail: schulz@cis.uni-muenchen.de"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CIS, University of Munich, Munich, Germany e-mail:","institution_ids":["https://openalex.org/I174004417"]},{"raw_affiliation_string":"Cis, university of munich, munich, germany e-mail: schulz@cis.uni-muenchen.de","institution_ids":["https://openalex.org/I8204097"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5114255303"],"corresponding_institution_ids":["https://openalex.org/I4210134980"],"apc_list":null,"apc_paid":null,"fwci":0.466,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.74208009,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"13","issue":"4","first_page":"353","last_page":"381"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11567","display_name":"semigroups and automata theory","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.9772204160690308},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7851639986038208},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.7467299699783325},{"id":"https://openalex.org/keywords/transducer","display_name":"Transducer","score":0.5081319808959961},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45777082443237305},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4547308385372162},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2750076353549957},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.13164207339286804},{"id":"https://openalex.org/keywords/theoretical-physics","display_name":"Theoretical physics","score":0.05225035548210144}],"concepts":[{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.9772204160690308},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7851639986038208},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.7467299699783325},{"id":"https://openalex.org/C56318395","wikidata":"https://www.wikidata.org/wiki/Q215928","display_name":"Transducer","level":2,"score":0.5081319808959961},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45777082443237305},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4547308385372162},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2750076353549957},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13164207339286804},{"id":"https://openalex.org/C33332235","wikidata":"https://www.wikidata.org/wiki/Q18362","display_name":"Theoretical physics","level":1,"score":0.05225035548210144},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s1351324905004092","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324905004092","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6499999761581421,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1500492658","https://openalex.org/W1513168562","https://openalex.org/W1548701969","https://openalex.org/W1556847696","https://openalex.org/W1563342424","https://openalex.org/W1602846073","https://openalex.org/W1606377818","https://openalex.org/W1860547055","https://openalex.org/W2002089154","https://openalex.org/W2002785199","https://openalex.org/W2007624857","https://openalex.org/W2010595692","https://openalex.org/W2021833629","https://openalex.org/W2032898343","https://openalex.org/W2035967403","https://openalex.org/W2058200372","https://openalex.org/W2081687495","https://openalex.org/W2082713237","https://openalex.org/W2093476618","https://openalex.org/W2098162425","https://openalex.org/W2099964107","https://openalex.org/W2100000146","https://openalex.org/W2100716182","https://openalex.org/W2100796029","https://openalex.org/W2125529971","https://openalex.org/W2142268730","https://openalex.org/W2143173740","https://openalex.org/W2154478838","https://openalex.org/W2170706044","https://openalex.org/W2296035094","https://openalex.org/W2753176400","https://openalex.org/W2950053197","https://openalex.org/W2951009239","https://openalex.org/W3009586891","https://openalex.org/W4245608667","https://openalex.org/W4249958171","https://openalex.org/W4252090733","https://openalex.org/W4299138792","https://openalex.org/W4302339081","https://openalex.org/W6630740198","https://openalex.org/W6678720029","https://openalex.org/W6680966335"],"related_works":["https://openalex.org/W2120204135","https://openalex.org/W1796293478","https://openalex.org/W174435416","https://openalex.org/W2168276503","https://openalex.org/W2139396251","https://openalex.org/W4302964898","https://openalex.org/W1805991041","https://openalex.org/W90089155","https://openalex.org/W2343223407","https://openalex.org/W1851409572"],"abstract_inverted_index":{"Abstract":[0],"Problems":[1],"in":[2,76,134,154,158,205],"the":[3,111,116,130,135,138,142,170,175,189],"area":[4],"of":[5,32,47,67,81,137,147],"text":[6,15,26,71,79,105,145],"and":[7,55,109],"document":[8],"processing":[9,208],"can":[10,191],"often":[11],"be":[12,192],"described":[13],"as":[14,107],"rewriting":[16,33,40,60,72,95,113,177,203],"tasks":[17,204],":":[18],"given":[19,43,93],"an":[20,77,88],"input":[21,78,108,139],"text,":[22],"produce":[23],"a":[24,39,45,50,59,64,94,99,155,183,206],"new":[25],"by":[27,44,83],"applying":[28],"some":[29],"fixed":[30],"set":[31],"rules.":[34],"In":[35],"its":[36,56],"simplest":[37],"form,":[38],"rule":[41],"is":[42,132,152,179],"pair":[46],"strings,":[48],"representing":[49],"source":[51],"string":[52],"(the":[53],"\u201coriginal\u201d)":[54],"substitute.":[57],"By":[58],"dictionary,":[61],"we":[62],"mean":[63],"finite":[65],"list":[66],"such":[68],"pairs;":[69],"dictionary-based":[70],"means":[73],"to":[74,128,198],"replace":[75],"occurrences":[80],"originals":[82],"their":[84],"substitutes.":[85],"We":[86],"present":[87],"efficient":[89],"method":[90],"for":[91],"constructing,":[92],"dictionary":[96],"D":[97],",":[98],"subsequential":[100],"transducer":[101,131,190],"that":[102],"accepts":[103],"any":[104,144],"t":[106,123,146,150,162,164,167],"outputs":[110],"intended":[112],"result":[114],"under":[115],"so-called":[117],"\u201cleftmost-longest":[118],"match\u201d":[119],"replacement":[120],"with":[121,195],"skips,":[122],"'.":[124],"The":[125],"time":[126,159],"needed":[127],"compute":[129],"linear":[133],"size":[136],"dictionary.":[140],"Given":[141],"transducer,":[143],"length":[148],"|":[149,151],"rewritten":[153],"deterministic":[156],"manner":[157],"O":[160],"(|":[161],"|+|":[163],"'|),":[165],"where":[166],"'":[168],"denotes":[169],"resulting":[171,176],"output":[172],"text.":[173],"Hence":[174],"mechanism":[178],"very":[180],"efficient.":[181],"As":[182],"second":[184],"advantage,":[185],"using":[186],"standard":[187],"tools,":[188],"directly":[193],"composed":[194],"other":[196],"transducers":[197],"efficiently":[199],"solve":[200],"more":[201],"complex":[202],"single":[207],"step.":[209]},"counts_by_year":[{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
