{"id":"https://openalex.org/W2626778328","doi":"https://doi.org/10.65215/2q58a426","title":"Attention Is All You Need","display_name":"Attention Is All You Need","publication_year":2025,"publication_date":"2025-08-23","ids":{"openalex":"https://openalex.org/W2626778328","doi":"https://doi.org/10.65215/2q58a426","mag":"2626778328"},"language":"en","primary_location":{"id":"doi:10.65215/2q58a426","is_oa":false,"landing_page_url":"https://doi.org/10.65215/2q58a426","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://langtaosha.org.cn/index.php/lts/preprint/download/10/108","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103024730","display_name":"Ashish Vaswani","orcid":"https://orcid.org/0000-0002-7794-2085"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ashish Vaswani","raw_affiliation_strings":["Google Brain","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Brain","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021878400","display_name":"Noam Shazeer","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Noam Shazeer","raw_affiliation_strings":["Google Brain","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Brain","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005777963","display_name":"Niki Parmar","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Niki Parmar","raw_affiliation_strings":["Google Research","University of Southern California, Los Angeles, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"University of Southern California, Los Angeles, United States","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022416424","display_name":"Jakob Uszkoreit","orcid":"https://orcid.org/0000-0001-5066-7530"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jakob Uszkoreit","raw_affiliation_strings":["Google Research","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023448834","display_name":"Llion Jones","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Llion Jones","raw_affiliation_strings":["Google Research","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079288315","display_name":"Aidan N. Gomez","orcid":"https://orcid.org/0000-0001-5601-5437"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Aidan N.Gomez","raw_affiliation_strings":["University of Toronto","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031789995","display_name":"\u0141ukasz Kaiser","orcid":"https://orcid.org/0000-0003-1092-6010"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lukasz Kaiser","raw_affiliation_strings":["Google Brain","Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Brain","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045719436","display_name":"Illia Polosukhin","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Illia Polosukhin","raw_affiliation_strings":["Google (United States), Mountain View, United States"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5103024730"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":156.2626,"has_fulltext":false,"cited_by_count":6551,"citation_normalized_percentile":{"value":0.99983993,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"30","issue":null,"first_page":"5998","last_page":"6008"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8567242622375488},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.8367122411727905},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.7707333564758301},{"id":"https://openalex.org/keywords/bleu","display_name":"BLEU","score":0.7233442068099976},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6436600685119629},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6131019592285156},{"id":"https://openalex.org/keywords/parallelizable-manifold","display_name":"Parallelizable manifold","score":0.5284521579742432},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.5106223225593567},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4961920380592346},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49199363589286804},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4886353611946106},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.48495081067085266},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.42289119958877563},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3937355577945709},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3607896566390991},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14444169402122498}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8567242622375488},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.8367122411727905},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.7707333564758301},{"id":"https://openalex.org/C622187","wikidata":"https://www.wikidata.org/wiki/Q3500773","display_name":"BLEU","level":3,"score":0.7233442068099976},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6436600685119629},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6131019592285156},{"id":"https://openalex.org/C148047603","wikidata":"https://www.wikidata.org/wiki/Q1014612","display_name":"Parallelizable manifold","level":2,"score":0.5284521579742432},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.5106223225593567},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4961920380592346},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49199363589286804},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4886353611946106},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.48495081067085266},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.42289119958877563},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3937355577945709},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3607896566390991},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14444169402122498},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":11,"locations":[{"id":"doi:10.65215/2q58a426","is_oa":false,"landing_page_url":"https://doi.org/10.65215/2q58a426","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/ctdc8e75","is_oa":false,"landing_page_url":"https://doi.org/10.65215/ctdc8e75","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/mdcm8z23","is_oa":false,"landing_page_url":"https://doi.org/10.65215/mdcm8z23","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/ne77pf66","is_oa":false,"landing_page_url":"https://doi.org/10.65215/ne77pf66","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/nxvz2v36","is_oa":false,"landing_page_url":"https://doi.org/10.65215/nxvz2v36","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/pc26a033","is_oa":false,"landing_page_url":"https://doi.org/10.65215/pc26a033","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/r5bs2d54","is_oa":true,"landing_page_url":"https://doi.org/10.65215/r5bs2d54","pdf_url":"https://langtaosha.org.cn/index.php/lts/preprint/download/10/108","source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"doi:10.65215/ysbyhc05","is_oa":false,"landing_page_url":"https://doi.org/10.65215/ysbyhc05","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"pmh:oai:arXiv.org:1706.03762","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1706.03762","pdf_url":"https://arxiv.org/pdf/1706.03762","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.1706.03762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1706.03762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2963403868","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1706.03762v5","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"arXiv (Cornell University)","raw_type":null}],"best_oa_location":{"id":"doi:10.65215/r5bs2d54","is_oa":true,"landing_page_url":"https://doi.org/10.65215/r5bs2d54","pdf_url":"https://langtaosha.org.cn/index.php/lts/preprint/download/10/108","source":null,"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.550000011920929}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2626778328.pdf","grobid_xml":"https://content.openalex.org/works/W2626778328.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1632114991","https://openalex.org/W1810943226","https://openalex.org/W1902237438","https://openalex.org/W2113691817","https://openalex.org/W2126433015","https://openalex.org/W2139621418","https://openalex.org/W2163568299","https://openalex.org/W2194775991","https://openalex.org/W2259472270","https://openalex.org/W2289899728","https://openalex.org/W2514713644","https://openalex.org/W2525778437","https://openalex.org/W2545625743","https://openalex.org/W2594990650","https://openalex.org/W2605203995","https://openalex.org/W2612675303","https://openalex.org/W2613904329","https://openalex.org/W2949847915","https://openalex.org/W2951008357","https://openalex.org/W2951583185","https://openalex.org/W2952191002","https://openalex.org/W2952339051","https://openalex.org/W2962784628","https://openalex.org/W2963069010","https://openalex.org/W2963187627","https://openalex.org/W2963991316","https://openalex.org/W2964121744","https://openalex.org/W2964308564"],"related_works":["https://openalex.org/W2965373594","https://openalex.org/W2964308564","https://openalex.org/W2964121744","https://openalex.org/W2963341956","https://openalex.org/W2963091558","https://openalex.org/W2962784628","https://openalex.org/W2950577311","https://openalex.org/W2950133940","https://openalex.org/W2949888546","https://openalex.org/W2787560479","https://openalex.org/W2525778437","https://openalex.org/W2250539671","https://openalex.org/W2194775991","https://openalex.org/W2163605009","https://openalex.org/W2157331557","https://openalex.org/W2108598243","https://openalex.org/W2101105183","https://openalex.org/W2095705004","https://openalex.org/W2064675550","https://openalex.org/W1902237438"],"abstract_inverted_index":{"The":[0,18],"dominant":[1],"sequence":[2],"transduction":[3],"models":[4,21,60,137],"are":[5],"based":[6,41],"on":[7,43,53,82,124],"complex":[8],"recurrent":[9],"or":[10],"convolutional":[11],"neural":[12],"networks":[13],"in":[14,64],"an":[15,29],"encoder-decoder":[16],"configuration.":[17],"best":[19,93,136],"performing":[20],"also":[22],"connect":[23],"the":[24,39,83,91,102,131,135,139,144],"encoder":[25],"and":[26,49,70,162],"decoder":[27],"through":[28],"attention":[30,44],"mechanism.":[31],"We":[32,141],"propose":[33],"a":[34,111,127],"new":[35,112],"simple":[36],"network":[37],"architecture,":[38],"Transformer,":[40],"solely":[42],"mechanisms,":[45],"dispensing":[46],"with":[47,160],"recurrence":[48],"convolutions":[50],"entirely.":[51],"Experiments":[52],"two":[54],"machine":[55],"translation":[56,87,106],"tasks":[57,150],"show":[58,142],"these":[59],"to":[61,75,148,155],"be":[62],"superior":[63],"quality":[65],"while":[66],"being":[67],"more":[68],"parallelizable":[69],"requiring":[71],"significantly":[72],"less":[73],"time":[74],"train.":[76],"Our":[77],"model":[78,109],"achieves":[79],"28.4":[80],"BLEU":[81,115],"WMT":[84,103],"2014":[85,104],"English-to-German":[86],"task,":[88,107],"improving":[89],"over":[90,98],"existing":[92],"results,":[94],"including":[95],"ensembles":[96],"by":[97,151],"2":[99],"BLEU.":[100],"On":[101],"English-to-French":[105],"our":[108],"establishes":[110],"single-model":[113],"state-of-the-art":[114],"score":[116],"of":[117,130,134],"41.8":[118],"after":[119],"training":[120,132,164],"for":[121],"3.5":[122],"days":[123],"eight":[125],"GPUs,":[126],"small":[128],"fraction":[129],"costs":[133],"from":[138],"literature.":[140],"that":[143],"Transformer":[145],"generalizes":[146],"well":[147],"other":[149],"applying":[152],"it":[153],"successfully":[154],"English":[156],"constituency":[157],"parsing":[158],"both":[159],"large":[161],"limited":[163],"data.":[165]},"counts_by_year":[{"year":2026,"cited_by_count":60},{"year":2025,"cited_by_count":23},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":176},{"year":2021,"cited_by_count":2998},{"year":2020,"cited_by_count":1819},{"year":2019,"cited_by_count":955},{"year":2018,"cited_by_count":447},{"year":2017,"cited_by_count":49},{"year":2012,"cited_by_count":1}],"updated_date":"2026-05-28T09:10:13.091523","created_date":"2017-06-23T00:00:00"}
