{"id":"https://openalex.org/W7138942011","doi":"https://doi.org/10.48550/arxiv.2603.15953","title":"A Family of LLMs Liberated from Static Vocabularies","display_name":"A Family of LLMs Liberated from Static Vocabularies","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138942011","doi":"https://doi.org/10.48550/arxiv.2603.15953"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15953","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15953","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15953","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130040763","display_name":"Aleph Alpha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alpha, Aleph","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129852740","display_name":":","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":":","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006478413","display_name":"Adnen Abdessaied","orcid":"https://orcid.org/0000-0002-9489-6340"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdessaied, Adnen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035498724","display_name":"Artur Baranowski","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baranowski, Artur","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129807204","display_name":"Lukas Balles","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balles, Lukas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130087687","display_name":"Michael Barlow","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barlow, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057903433","display_name":"Fabien Benureau","orcid":"https://orcid.org/0000-0003-4083-4512"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Benureau, Fabien C. Y.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130169516","display_name":"Felix Berkenkamp","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Berkenkamp, Felix","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129909023","display_name":"Lukas Bluebaum","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bluebaum, Lukas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049893678","display_name":"Bastian Boll","orcid":"https://orcid.org/0000-0002-3490-3350"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boll, Bastian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042575470","display_name":"Thomas F Burns","orcid":"https://orcid.org/0000-0002-1123-2929"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Burns, Thomas F.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129824783","display_name":"Bj\u00f6rn Deiseroth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deiseroth, Bj\u00f6rn","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036135663","display_name":"Constantin Eichenberg","orcid":"https://orcid.org/0000-0002-9973-2687"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eichenberg, Constantin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130195304","display_name":"David Friede","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Friede, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129944207","display_name":"Pablo Iyu Guerrero","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guerrero, Pablo Iyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130163521","display_name":"Ahmed Hammam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hammam, Ahmed","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024191282","display_name":"Bastian Harren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Harren, Bastian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087581366","display_name":"J. Higl","orcid":"https://orcid.org/0000-0001-9697-6558"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Higl, Johann","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129947788","display_name":"Yasser Jadidi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jadidi, Yasser","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024327650","display_name":"Carina Kauf","orcid":"https://orcid.org/0000-0002-2718-1978"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kauf, Carina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009238504","display_name":"Johannes Messner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Messner, Johannes","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049054914","display_name":"Jan Hendrik Metzen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Metzen, Jan Hendrik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093211853","display_name":"Max Meuer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meuer, Max","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048896019","display_name":"Vedant Nanda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nanda, Vedant","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115944809","display_name":"Pit Neitemeier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neitemeier, Pit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058203980","display_name":"Koen Oostermeijer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oostermeijer, Koen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130120283","display_name":"Letitia Parcalabescu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parcalabescu, Letitia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129945795","display_name":"Markus Pernpointner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pernpointner, Markus","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130139545","display_name":"Felix Reinfurt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reinfurt, Felix","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129836066","display_name":"Dylan Rodriquez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rodriquez, Dylan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109811864","display_name":"G. Schott","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schott, Gr\u00e9gory","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074584188","display_name":"Philipp Siedler","orcid":"https://orcid.org/0000-0002-2284-1674"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Siedler, Philipp","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026733401","display_name":"Martin Simonovsky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Simonovsky, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127856319","display_name":"Till Speicher","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Speicher, Till","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130017728","display_name":"Volker Stampa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stampa, Volker","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129779635","display_name":"Stephan W\u00e4ldchen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"W\u00e4ldchen, Stephan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055789969","display_name":"Samuel Weinbach","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weinbach, Samuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129821029","display_name":"Gregor Ziegltrum","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ziegltrum, Gregor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":38,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.35109999775886536,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.35109999775886536,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.2538999915122986,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.04270000010728836,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6098999977111816},{"id":"https://openalex.org/keywords/byte","display_name":"Byte","score":0.5217999815940857},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5123000144958496},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.48510000109672546},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.478300005197525},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.44929999113082886},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.44830000400543213},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4388999938964844},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.42419999837875366}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6208000183105469},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6098999977111816},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.5217999815940857},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5123000144958496},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4945000112056732},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4864000082015991},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.48510000109672546},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.478300005197525},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.44929999113082886},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.44830000400543213},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4388999938964844},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.42419999837875366},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.3707999885082245},{"id":"https://openalex.org/C141603448","wikidata":"https://www.wikidata.org/wiki/Q134830","display_name":"Prefix","level":2,"score":0.36559998989105225},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.30160000920295715},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2948000133037567},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.29330000281333923},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.29319998621940613},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.2858000099658966},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C24338571","wikidata":"https://www.wikidata.org/wiki/Q2566298","display_name":"Autoregressive integrated moving average","level":3,"score":0.26910001039505005},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C137212723","wikidata":"https://www.wikidata.org/wiki/Q1948412","display_name":"Morphism","level":2,"score":0.26089999079704285}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15953","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15953","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15953","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15953","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7421536445617676,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Tokenization":[0],"is":[1],"a":[2,50,85,172],"central":[3],"component":[4],"of":[5,52,91,165,196],"natural":[6],"language":[7,12],"processing":[8],"in":[9,221,229,238],"current":[10],"large":[11],"models":[13,16,53,113,122,132,244],"(LLMs),":[14],"enabling":[15],"to":[17,43,56,82,160,203],"convert":[18],"raw":[19],"text":[20,190],"into":[21,75,103,123],"processable":[22],"units.":[23],"Although":[24],"learned":[25],"tokenizers":[26],"are":[27,94,130,137],"widely":[28],"adopted,":[29],"they":[30],"exhibit":[31],"notable":[32],"limitations,":[33],"including":[34],"their":[35],"large,":[36],"fixed":[37],"vocabulary":[38],"sizes":[39],"and":[40,78,100,120,128,135,157,200,217,223],"poor":[41],"adaptability":[42],"new":[44],"domains":[45],"or":[46],"languages.":[47],"We":[48,105,169,241],"present":[49],"family":[51],"with":[54,153],"up":[55],"70":[57],"billion":[58],"parameters":[59],"based":[60],"on":[61,181,233,249],"the":[62,83,92,98,116,124,145,150,154,166,194,234],"hierarchical":[63],"autoregressive":[64,87],"transformer":[65,72,151],"(HAT)":[66],"architecture.":[67],"In":[68],"HAT,":[69],"an":[70],"encoder":[71,134],"aggregates":[73],"bytes":[74],"word":[76,162],"embeddings":[77,163],"then":[79,95],"feeds":[80],"them":[81],"backbone,":[84,148],"classical":[86],"transformer.":[88],"The":[89,186],"outputs":[90],"backbone":[93],"cross-attended":[96],"by":[97,114,192],"decoder":[99,136],"converted":[101],"back":[102],"bytes.":[104],"show":[106,226],"that":[107],"we":[108,143,225],"can":[109],"reuse":[110],"available":[111],"pre-trained":[112,146],"converting":[115],"Llama":[117,147,236],"3.1":[118,237],"8B":[119],"70B":[121],"HAT":[125,174,187],"architecture:":[126],"Llama-3.1-8B-TFree-HAT":[127],"Llama-3.1-70B-TFree-HAT":[129],"byte-level":[131],"whose":[133],"trained":[138,177],"from":[139,179],"scratch,":[140],"but":[141],"where":[142],"adapt":[144],"i.e.,":[149],"blocks":[152],"embedding":[155],"matrix":[156],"head":[158],"removed,":[159],"handle":[161],"instead":[164],"original":[167,235],"tokens.":[168],"also":[170],"provide":[171],"7B":[173],"model,":[175],"Llama-TFree-HAT-Pretrained,":[176],"entirely":[178],"scratch":[180],"nearly":[182],"4":[183],"trillion":[184],"words.":[185],"architecture":[188],"improves":[189],"compression":[191],"reducing":[193],"number":[195],"required":[197],"sequence":[198],"positions":[199],"enhances":[201],"robustness":[202],"intra-word":[204],"variations,":[205],"e.g.,":[206],"spelling":[207],"differences.":[208],"Through":[209],"pre-training,":[210],"as":[211,213],"well":[212],"subsequent":[214],"supervised":[215],"fine-tuning":[216],"direct":[218],"preference":[219],"optimization":[220],"English":[222],"German,":[224],"strong":[227],"proficiency":[228],"both":[230],"languages,":[231],"improving":[232],"most":[239],"benchmarks.":[240],"release":[242],"our":[243],"(including":[245],"200":[246],"pre-training":[247],"checkpoints)":[248],"Hugging":[250],"Face.":[251]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-20T00:00:00"}
