{"id":"https://openalex.org/W4312558730","doi":"https://doi.org/10.1162/tacl_a_00510","title":"Getting BART to Ride the Idiomatic Train: Learning to Represent Idiomatic Expressions","display_name":"Getting BART to Ride the Idiomatic Train: Learning to Represent Idiomatic Expressions","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4312558730","doi":"https://doi.org/10.1162/tacl_a_00510"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00510","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00510","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00510/2054693/tacl_a_00510.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00510/2054693/tacl_a_00510.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110723518","display_name":"Ziheng Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ziheng Zeng","raw_affiliation_strings":["Department of Electrical and Computer Engineering University of Illinois at Urbana-Champaign Champaign, IL USA zzeng13@illinois.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering University of Illinois at Urbana-Champaign Champaign, IL USA zzeng13@illinois.edu","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083777443","display_name":"Suma Bhat","orcid":"https://orcid.org/0000-0003-0324-5890"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Suma Bhat","raw_affiliation_strings":["Department of Electrical and Computer Engineering University of Illinois at Urbana-Champaign Champaign, IL USA spbhat2@illinois.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering University of Illinois at Urbana-Champaign Champaign, IL USA spbhat2@illinois.edu","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5083777443","https://openalex.org/A5110723518"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.8332,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.78347581,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":"10","issue":null,"first_page":"1120","last_page":"1137"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8220720291137695},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7446799278259277},{"id":"https://openalex.org/keywords/principle-of-compositionality","display_name":"Principle of compositionality","score":0.7332537770271301},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5969148874282837},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5548756122589111},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5455054044723511},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4724234342575073},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.45151519775390625}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8220720291137695},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7446799278259277},{"id":"https://openalex.org/C121375916","wikidata":"https://www.wikidata.org/wiki/Q936559","display_name":"Principle of compositionality","level":2,"score":0.7332537770271301},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5969148874282837},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5548756122589111},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5455054044723511},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4724234342575073},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.45151519775390625},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/tacl_a_00510","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00510","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00510/2054693/tacl_a_00510.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:ffd6eae464904473acc8abffc94c8b8c","is_oa":true,"landing_page_url":"https://doaj.org/article/ffd6eae464904473acc8abffc94c8b8c","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Transactions of the Association for Computational Linguistics, Vol 10, Pp 1120-1137 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00510","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00510","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00510/2054693/tacl_a_00510.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8500000238418579,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312558730.pdf","grobid_xml":"https://content.openalex.org/works/W4312558730.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W110339475","https://openalex.org/W172541218","https://openalex.org/W630883834","https://openalex.org/W1498763386","https://openalex.org/W1965879064","https://openalex.org/W2032532403","https://openalex.org/W2123215530","https://openalex.org/W2252211741","https://openalex.org/W2508425840","https://openalex.org/W2517996181","https://openalex.org/W2525778437","https://openalex.org/W2594108681","https://openalex.org/W2604760609","https://openalex.org/W2795843251","https://openalex.org/W2826721128","https://openalex.org/W2903908711","https://openalex.org/W2949445359","https://openalex.org/W2956530858","https://openalex.org/W2962688231","https://openalex.org/W2962784628","https://openalex.org/W2962945654","https://openalex.org/W2964274713","https://openalex.org/W2970641574","https://openalex.org/W2970925270","https://openalex.org/W2971044268","https://openalex.org/W2979826702","https://openalex.org/W3012932209","https://openalex.org/W3034760557","https://openalex.org/W3034999214","https://openalex.org/W3099793224","https://openalex.org/W3101498587","https://openalex.org/W3155744586","https://openalex.org/W3173281684","https://openalex.org/W3197690918","https://openalex.org/W3202282051","https://openalex.org/W3206846084","https://openalex.org/W3207350353","https://openalex.org/W3207539211","https://openalex.org/W3214523360","https://openalex.org/W3214578205","https://openalex.org/W4221086658","https://openalex.org/W4226190794","https://openalex.org/W4388119441","https://openalex.org/W6601031416","https://openalex.org/W6601655871","https://openalex.org/W6636771696","https://openalex.org/W6675354045","https://openalex.org/W6691444529","https://openalex.org/W6726295259","https://openalex.org/W6732015709","https://openalex.org/W6738045163","https://openalex.org/W6744777068","https://openalex.org/W6748819318","https://openalex.org/W6752410594","https://openalex.org/W6759579507","https://openalex.org/W6776148200","https://openalex.org/W6778777187","https://openalex.org/W6778883912","https://openalex.org/W6788219984","https://openalex.org/W6791353385","https://openalex.org/W6795436826","https://openalex.org/W6798057236","https://openalex.org/W6893231364"],"related_works":["https://openalex.org/W3095531775","https://openalex.org/W1526190050","https://openalex.org/W4251923961","https://openalex.org/W2477397717","https://openalex.org/W2010490241","https://openalex.org/W2500457737","https://openalex.org/W4287025733","https://openalex.org/W3192500523","https://openalex.org/W4317425742","https://openalex.org/W86971241"],"abstract_inverted_index":{"Abstract":[0],"Idiomatic":[1],"expressions":[2],"(IEs),":[3],"characterized":[4],"by":[5],"their":[6,37],"non-compositionality,":[7],"are":[8],"an":[9,62],"important":[10],"part":[11],"of":[12,46,113],"natural":[13],"language.":[14],"They":[15],"have":[16],"been":[17],"a":[18,53,65],"classical":[19],"challenge":[20],"to":[21,56,103],"NLP,":[22],"including":[23],"pre-trained":[24],"language":[25,68],"models":[26],"that":[27],"drive":[28],"today\u2019s":[29],"state-of-the-art.":[30],"Prior":[31],"work":[32],"has":[33],"identified":[34],"deficiencies":[35],"in":[36,95],"contextualized":[38],"representation":[39],"stemming":[40],"from":[41],"the":[42,109],"underlying":[43],"compositional":[44],"paradigm":[45],"representation.":[47],"In":[48],"this":[49],"work,":[50],"we":[51],"take":[52],"first-principles":[54],"approach":[55],"build":[57],"idiomaticity":[58],"into":[59],"BART":[60],"using":[61],"adapter":[63],"as":[64],"lightweight":[66],"non-compositional":[67],"expert":[69],"trained":[70],"on":[71,108],"idiomatic":[72],"sentences.":[73],"The":[74],"improved":[75],"capability":[76],"over":[77],"baselines":[78],"(e.g.,":[79],"BART)":[80],"is":[81],"seen":[82],"via":[83],"intrinsic":[84],"and":[85,101,117],"extrinsic":[86],"methods,":[87],"where":[88],"idiom":[89,110],"embeddings":[90],"score":[91,97],"0.19":[92],"points":[93],"higher":[94,105],"homogeneity":[96],"for":[98],"embedding":[99],"clustering,":[100],"up":[102],"25%":[104],"sequence":[106],"accuracy":[107],"processing":[111],"tasks":[112],"IE":[114],"sense":[115],"disambiguation":[116],"span":[118],"detection.":[119]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
