{"id":"https://openalex.org/W2948947170","doi":"https://doi.org/10.18653/v1/p19-1356","title":"What Does BERT Learn about the Structure of Language?","display_name":"What Does BERT Learn about the Structure of Language?","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2948947170","doi":"https://doi.org/10.18653/v1/p19-1356","mag":"2948947170"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1356","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1356","pdf_url":"https://www.aclweb.org/anthology/P19-1356.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1356.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057854225","display_name":"Ganesh Jawahar","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Ganesh Jawahar","raw_affiliation_strings":["Inria, France","Automatic Language Modelling and ANAlysis & Computational Humanities"],"affiliations":[{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Automatic Language Modelling and ANAlysis & Computational Humanities","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077663332","display_name":"Beno\u00eet Sagot","orcid":"https://orcid.org/0000-0002-0107-8526"},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Beno\u00eet Sagot","raw_affiliation_strings":["Inria, France","Automatic Language Modelling and ANAlysis & Computational Humanities"],"affiliations":[{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Automatic Language Modelling and ANAlysis & Computational Humanities","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010519567","display_name":"Djam\u00e9 Seddah","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Djam\u00e9 Seddah","raw_affiliation_strings":["Inria, France","Sorbonne Universite\u0301"],"affiliations":[{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Sorbonne Universite\u0301","institution_ids":["https://openalex.org/I39804081"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5057854225"],"corresponding_institution_ids":["https://openalex.org/I1326498283"],"apc_list":null,"apc_paid":null,"fwci":97.5481,"has_fulltext":true,"cited_by_count":1197,"citation_normalized_percentile":{"value":0.99956323,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3651","last_page":"3657"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8454751968383789},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.63039231300354},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6136537790298462},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5649352073669434},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.540395975112915},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.530394434928894},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.47390544414520264},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4428033232688904},{"id":"https://openalex.org/keywords/information-structure","display_name":"Information structure","score":0.4338006377220154},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4255511462688446},{"id":"https://openalex.org/keywords/verb-phrase","display_name":"Verb phrase","score":0.4232966899871826},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.369201123714447},{"id":"https://openalex.org/keywords/noun-phrase","display_name":"Noun phrase","score":0.297046422958374},{"id":"https://openalex.org/keywords/noun","display_name":"Noun","score":0.07206112146377563}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8454751968383789},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.63039231300354},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6136537790298462},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5649352073669434},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.540395975112915},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.530394434928894},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.47390544414520264},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4428033232688904},{"id":"https://openalex.org/C2779954242","wikidata":"https://www.wikidata.org/wiki/Q6031227","display_name":"Information structure","level":2,"score":0.4338006377220154},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4255511462688446},{"id":"https://openalex.org/C2779514573","wikidata":"https://www.wikidata.org/wiki/Q1778442","display_name":"Verb phrase","level":4,"score":0.4232966899871826},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.369201123714447},{"id":"https://openalex.org/C153962237","wikidata":"https://www.wikidata.org/wiki/Q1401131","display_name":"Noun phrase","level":3,"score":0.297046422958374},{"id":"https://openalex.org/C121934690","wikidata":"https://www.wikidata.org/wiki/Q1084","display_name":"Noun","level":2,"score":0.07206112146377563},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/p19-1356","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1356","pdf_url":"https://www.aclweb.org/anthology/P19-1356.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-02131630v1","is_oa":true,"landing_page_url":"https://inria.hal.science/hal-02131630","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ACL 2019 - 57th Annual Meeting of the Association for Computational Linguistics, Jul 2019, Florence, Italy","raw_type":"Conference papers"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1356","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1356","pdf_url":"https://www.aclweb.org/anthology/P19-1356.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G3858547910","display_name":null,"funder_award_id":"15-CE38-0011","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7779877577","display_name":"Parsing the Impossible, Translating the Improbable","funder_award_id":"ANR-16-CE33-0021","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2948947170.pdf","grobid_xml":"https://content.openalex.org/works/W2948947170.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1840435438","https://openalex.org/W2064675550","https://openalex.org/W2097606805","https://openalex.org/W2098921539","https://openalex.org/W2187089797","https://openalex.org/W2250539671","https://openalex.org/W2515741950","https://openalex.org/W2549835527","https://openalex.org/W2790235966","https://openalex.org/W2799124508","https://openalex.org/W2888329843","https://openalex.org/W2893141505","https://openalex.org/W2896457183","https://openalex.org/W2906152891","https://openalex.org/W2910243263","https://openalex.org/W2912351236","https://openalex.org/W2923014074","https://openalex.org/W2946359678","https://openalex.org/W2951299559","https://openalex.org/W2962776659","https://openalex.org/W2963013168","https://openalex.org/W2963310665","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963430224","https://openalex.org/W2964165804","https://openalex.org/W2964204621","https://openalex.org/W2964303116","https://openalex.org/W4288351520","https://openalex.org/W4288631803","https://openalex.org/W4289490673","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2039546652","https://openalex.org/W2012262991","https://openalex.org/W2373794620","https://openalex.org/W2067317451","https://openalex.org/W2362158790","https://openalex.org/W2355827199","https://openalex.org/W2387582696","https://openalex.org/W2356074100","https://openalex.org/W2363798100","https://openalex.org/W2618622683"],"abstract_inverted_index":{"BERT":[0,23,102,124],"is":[1,113],"a":[2,42,79,130],"recent":[3],"language":[4,14,52],"representation":[5,63],"model":[6],"that":[7,22,60,74,123,133],"has":[8],"surprisingly":[9],"performed":[10],"well":[11],"in":[12,67,93,129],"diverse":[13],"understanding":[15],"benchmarks.":[16],"This":[17],"result":[18],"indicates":[19],"the":[20,48,68,89,94,100],"possibility":[21],"networks":[24],"capture":[25,126],"structural":[26],"information":[27,66,112,128],"about":[28],"language.":[29],"In":[30],"this":[31,38],"work,":[32],"we":[33,121],"provide":[34],"novel":[35],"support":[36],"for":[37],"claim":[39],"by":[40,55],"performing":[41],"series":[43],"of":[44,50,82],"experiments":[45],"to":[46,105,116],"unpack":[47],"elements":[49],"English":[51],"structure":[53],"learned":[54],"BERT.":[56],"We":[57,71],"first":[58],"show":[59,73,122],"BERT's":[61,75],"phrasal":[62],"captures":[64],"phrase-level":[65],"lower":[69],"layers.":[70],"also":[72],"intermediate":[76],"layers":[77,108],"encode":[78],"rich":[80],"hierarchy":[81],"linguistic":[83,127],"information,":[84],"with":[85],"surface":[86],"features":[87,92,98],"at":[88,99],"bottom,":[90],"syntactic":[91],"middle":[95],"and":[96],"semantic":[97],"top.":[101],"turns":[103],"out":[104],"require":[106],"deeper":[107],"when":[109],"long-distance":[110],"dependency":[111],"required,":[114],"e.g.":[115],"track":[117],"subjectverb":[118],"agreement.":[119],"Finally,":[120],"representations":[125],"compositional":[131],"way":[132],"mimics":[134],"classical,":[135],"tree-like":[136],"structures.":[137]},"counts_by_year":[{"year":2026,"cited_by_count":19},{"year":2025,"cited_by_count":145},{"year":2024,"cited_by_count":141},{"year":2023,"cited_by_count":218},{"year":2022,"cited_by_count":216},{"year":2021,"cited_by_count":250},{"year":2020,"cited_by_count":191},{"year":2019,"cited_by_count":17}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
