{"id":"https://openalex.org/W4408105704","doi":"https://doi.org/10.1162/tacl_a_00736","title":"Transformers as Transducers","display_name":"Transformers as Transducers","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4408105704","doi":"https://doi.org/10.1162/tacl_a_00736"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00736","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00736","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00736/2506494/tacl_a_00736.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00736/2506494/tacl_a_00736.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092616543","display_name":"Lena Strobl","orcid":null},"institutions":[{"id":"https://openalex.org/I90267481","display_name":"Ume\u00e5 University","ror":"https://ror.org/05kb8h459","country_code":"SE","type":"education","lineage":["https://openalex.org/I90267481"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Lena Strobl","raw_affiliation_strings":["Ume\u00e5 University, Sweden. lena.strobl@umu.se"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ume\u00e5 University, Sweden. lena.strobl@umu.se","institution_ids":["https://openalex.org/I90267481"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022630792","display_name":"Dana Angluin","orcid":"https://orcid.org/0000-0002-6907-2999"},"institutions":[{"id":"https://openalex.org/I32971472","display_name":"Yale University","ror":"https://ror.org/03v76x132","country_code":"US","type":"education","lineage":["https://openalex.org/I32971472"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dana Angluin","raw_affiliation_strings":["Yale University, USA. dana.angluin@yale.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yale University, USA. dana.angluin@yale.edu","institution_ids":["https://openalex.org/I32971472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036026526","display_name":"David Chiang","orcid":"https://orcid.org/0000-0002-0435-4864"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Chiang","raw_affiliation_strings":["University of Notre Dame, USA. dchiang@nd.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Notre Dame, USA. dchiang@nd.edu","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015005264","display_name":"Jonathan Rawski","orcid":"https://orcid.org/0000-0003-3996-9815"},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Rawski","raw_affiliation_strings":["San Jos\u00e9 State University, USA. jon.rawski@sjsu.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"San Jos\u00e9 State University, USA. jon.rawski@sjsu.edu","institution_ids":["https://openalex.org/I51504820"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077726785","display_name":"Ashish Sabharwal","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140341","display_name":"Allen Institute","ror":"https://ror.org/03cpe7c52","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210140341"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashish Sabharwal","raw_affiliation_strings":["Allen Institute for AI, USA. ashishs@allenai.org"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Allen Institute for AI, USA. ashishs@allenai.org","institution_ids":["https://openalex.org/I4210140341"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5092616543"],"corresponding_institution_ids":["https://openalex.org/I90267481"],"apc_list":null,"apc_paid":null,"fwci":1.9057,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.86221461,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"13","issue":null,"first_page":"200","last_page":"219"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11567","display_name":"semigroups and automata theory","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7919126749038696},{"id":"https://openalex.org/keywords/transducer","display_name":"Transducer","score":0.6021292209625244},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5941919088363647},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.35504668951034546},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.16053369641304016},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09144142270088196}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7919126749038696},{"id":"https://openalex.org/C56318395","wikidata":"https://www.wikidata.org/wiki/Q215928","display_name":"Transducer","level":2,"score":0.6021292209625244},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5941919088363647},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.35504668951034546},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.16053369641304016},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09144142270088196}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1162/tacl_a_00736","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00736","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00736/2506494/tacl_a_00736.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:DiVA.org:umu-242255","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:umu:diva-242255","pdf_url":null,"source":{"id":"https://openalex.org/S4306400361","display_name":"DiVA at Ume\u00e5 University (Ume\u00e5 University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I90267481","host_organization_name":"Ume\u00e5 University","host_organization_lineage":["https://openalex.org/I90267481"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:scholarworks.sjsu.edu:faculty_rsca-7168","is_oa":true,"landing_page_url":"https://scholarworks.sjsu.edu/faculty_rsca/6169","pdf_url":null,"source":{"id":"https://openalex.org/S4377196389","display_name":"San Jos\u00e9 State University ScholarWorks (San Jose State University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I51504820","host_organization_name":"San Jose State University","host_organization_lineage":["https://openalex.org/I51504820"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Faculty Research, Scholarly, and Creative Activity","raw_type":"text"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00736","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00736","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00736/2506494/tacl_a_00736.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4408105704.pdf","grobid_xml":"https://content.openalex.org/works/W4408105704.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W1583837637","https://openalex.org/W1997049674","https://openalex.org/W2060270693","https://openalex.org/W2116250539","https://openalex.org/W2125529971","https://openalex.org/W2274615375","https://openalex.org/W2531193976","https://openalex.org/W2897955526","https://openalex.org/W2952744660","https://openalex.org/W3014096773","https://openalex.org/W3037332318","https://openalex.org/W3149261839","https://openalex.org/W3175990774","https://openalex.org/W4224874866","https://openalex.org/W4284701759","https://openalex.org/W4285206226","https://openalex.org/W4289856124","https://openalex.org/W4290994975","https://openalex.org/W4310895557","https://openalex.org/W4385008324","https://openalex.org/W4385571157","https://openalex.org/W4394634418","https://openalex.org/W4396767926","https://openalex.org/W6678720029","https://openalex.org/W6739901393","https://openalex.org/W6788417511","https://openalex.org/W6857333724"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2012283803","https://openalex.org/W4384820447","https://openalex.org/W2072454424","https://openalex.org/W2117438306","https://openalex.org/W2185942010","https://openalex.org/W2260725127","https://openalex.org/W2864363823"],"abstract_inverted_index":{"Abstract":[0],"We":[1,28,49],"study":[2],"the":[3,51,65,87],"sequence-to-sequence":[4,57],"mapping":[5],"capacity":[6],"of":[7,24,33,90],"transformers":[8,126],"by":[9],"relating":[10],"them":[11],"to":[12,39,56],"finite":[13],"transducers,":[14],"and":[15,59,93,113],"find":[16],"that":[17,61,122],"they":[18],"can":[19,127],"express":[20],"surprisingly":[21],"large":[22],"classes":[23],"(total":[25],"functional)":[26],"transductions.":[27,98,118],"do":[29],"so":[30],"using":[31],"variants":[32],"RASP,":[34],"a":[35,91,111],"programming":[36],"language":[37],"designed":[38],"help":[40],"people":[41],"\u201cthink":[42],"like":[43],"transformers,\u201d":[44],"as":[45,70,85,109],"an":[46],"intermediate":[47],"representation.":[48],"extend":[50],"existing":[52],"Boolean":[53],"variant":[54],"B-RASP":[55],"transductions":[58,68],"show":[60,121],"it":[62],"computes":[63],"exactly":[64],"first-order":[66,96,116],"rational":[67],"(such":[69,84,108],"string":[71],"rotation).":[72],"Then,":[73],"we":[74,120],"introduce":[75],"two":[76],"new":[77],"extensions.":[78],"B-RASP[pos]":[79],"enables":[80,104],"calculations":[81],"on":[82],"positions":[83],"copying":[86],"first":[88],"half":[89],"string)":[92,112],"contains":[94,114],"all":[95,115],"regular":[97],"S-RASP":[99],"adds":[100],"prefix":[101],"sum,":[102],"which":[103],"additional":[105],"arithmetic":[106],"operations":[107],"squaring":[110],"polyregular":[117],"Finally,":[119],"masked":[123],"average-hard":[124],"attention":[125],"simulate":[128],"S-RASP.":[129]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
