{"id":"https://openalex.org/W3121593933","doi":"https://doi.org/10.18653/v1/2021.eacl-main.176","title":"Language Modelling as a Multi-Task Problem","display_name":"Language Modelling as a Multi-Task Problem","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3121593933","doi":"https://doi.org/10.18653/v1/2021.eacl-main.176","mag":"3121593933"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2021.eacl-main.176","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.eacl-main.176","pdf_url":"https://aclanthology.org/2021.eacl-main.176.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2021.eacl-main.176.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020867334","display_name":"Lucas Weber","orcid":"https://orcid.org/0000-0002-6877-6935"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lucas Weber","raw_affiliation_strings":["Pompeu Fabra Univ"],"affiliations":[{"raw_affiliation_string":"Pompeu Fabra Univ","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056188012","display_name":"Jaap Jumelet","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Jaap Jumelet","raw_affiliation_strings":["ILLC, University of Amsterdam","University of Amsterdam"],"affiliations":[{"raw_affiliation_string":"ILLC, University of Amsterdam","institution_ids":["https://openalex.org/I887064364"]},{"raw_affiliation_string":"University of Amsterdam","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007465102","display_name":"Elia Bruni","orcid":null},"institutions":[{"id":"https://openalex.org/I170658231","display_name":"Osnabr\u00fcck University","ror":"https://ror.org/04qmmjx98","country_code":"DE","type":"education","lineage":["https://openalex.org/I170658231"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Elia Bruni","raw_affiliation_strings":["IKW, University of Osnabrck"],"affiliations":[{"raw_affiliation_string":"IKW, University of Osnabrck","institution_ids":["https://openalex.org/I170658231"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018069499","display_name":"Dieuwke Hupkes","orcid":null},"institutions":[{"id":"https://openalex.org/I2252078561","display_name":"Meta (Israel)","ror":"https://ror.org/02388em19","country_code":"IL","type":"company","lineage":["https://openalex.org/I2252078561","https://openalex.org/I4210114444"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Dieuwke Hupkes","raw_affiliation_strings":["Facebook AI Research","Facebook"],"affiliations":[{"raw_affiliation_string":"Facebook AI Research","institution_ids":["https://openalex.org/I2252078561"]},{"raw_affiliation_string":"Facebook","institution_ids":["https://openalex.org/I2252078561"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020867334"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.01493,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2049","last_page":"2060"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8761595487594604},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7604208588600159},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.699182391166687},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5400444269180298},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5122680068016052},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.4801306426525116},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.46100208163261414},{"id":"https://openalex.org/keywords/applied-linguistics","display_name":"Applied linguistics","score":0.4163759648799896},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.3465944528579712},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2142990231513977}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8761595487594604},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7604208588600159},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.699182391166687},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5400444269180298},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5122680068016052},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.4801306426525116},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.46100208163261414},{"id":"https://openalex.org/C167055898","wikidata":"https://www.wikidata.org/wiki/Q321249","display_name":"Applied linguistics","level":2,"score":0.4163759648799896},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3465944528579712},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2142990231513977},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.18653/v1/2021.eacl-main.176","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.eacl-main.176","pdf_url":"https://aclanthology.org/2021.eacl-main.176.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2101.11287","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2101.11287","pdf_url":"https://arxiv.org/pdf/2101.11287","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"pmh:oai:dare.uva.nl:publications/d8da817d-e365-464d-831f-cf637e7d282a","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/language-modelling-as-a-multitask-problem(d8da817d-e365-464d-831f-cf637e7d282a).html","pdf_url":"https://pure.uva.nl/ws/files/99959758/2021.eacl_main.176.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Weber, L, Jumelet, J, Bruni, E & Hupkes, D 2021, Language Modelling as a Multi-Task Problem. in P Merlo, J Tiedemann & R Tsarfaty (eds), The 16th Conference of the European Chapter of the Association for Computational Linguistics : EACL 2021 : proceedings of the conference : April 19-23, 2021. Stroudsburg, PA, pp. 2049\u20132060, 16th Conference of the European Chapter of the Association for Computational Linguistics, 19/04/21. https://doi.org/10.18653/v1/2021.eacl-main.176","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:uvapub:oai:dare.uva.nl:publications/d8da817d-e365-464d-831f-cf637e7d282a","is_oa":true,"landing_page_url":"https://dare.uva.nl/personal/pure/en/publications/language-modelling-as-a-multitask-problem(d8da817d-e365-464d-831f-cf637e7d282a).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"The 16th Conference of the European Chapter of the Association for Computational Linguistics: EACL 2021 : proceedings of the conference : April 19-23, 2021","raw_type":"info:eu-repo/semantics/conferencepaper"},{"id":"doi:10.48550/arxiv.2101.11287","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2101.11287","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:3121593933","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"doi:10.18653/v1/2021.eacl-main.176","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.eacl-main.176","pdf_url":"https://aclanthology.org/2021.eacl-main.176.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3121593933.pdf","grobid_xml":"https://content.openalex.org/works/W3121593933.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1522920269","https://openalex.org/W1540511257","https://openalex.org/W1560550898","https://openalex.org/W1593222164","https://openalex.org/W1614862348","https://openalex.org/W1896424170","https://openalex.org/W2109606373","https://openalex.org/W2117130368","https://openalex.org/W2123257246","https://openalex.org/W2130903752","https://openalex.org/W2155541015","https://openalex.org/W2156267734","https://openalex.org/W2158899491","https://openalex.org/W2165698076","https://openalex.org/W2170563643","https://openalex.org/W2251329024","https://openalex.org/W2592170186","https://openalex.org/W2624871570","https://openalex.org/W2626792426","https://openalex.org/W2741937156","https://openalex.org/W2802158617","https://openalex.org/W2888329843","https://openalex.org/W2888922637","https://openalex.org/W2913340405","https://openalex.org/W2918996109","https://openalex.org/W2946417913","https://openalex.org/W2963341956","https://openalex.org/W2963751529","https://openalex.org/W2964117978","https://openalex.org/W2964303116","https://openalex.org/W2980113592","https://openalex.org/W3013286647","https://openalex.org/W3034672970","https://openalex.org/W3035219538","https://openalex.org/W3042795397","https://openalex.org/W3103520839","https://openalex.org/W3104240813"],"related_works":["https://openalex.org/W3154603286","https://openalex.org/W2043943145","https://openalex.org/W2963344980","https://openalex.org/W3089829989","https://openalex.org/W3196144092","https://openalex.org/W1518025116","https://openalex.org/W2999190900","https://openalex.org/W2107996423","https://openalex.org/W2904870187","https://openalex.org/W2139612797","https://openalex.org/W897316281","https://openalex.org/W2898289269","https://openalex.org/W3186846719","https://openalex.org/W2906689385","https://openalex.org/W2497030462","https://openalex.org/W3096655658","https://openalex.org/W2185307709","https://openalex.org/W1561983327","https://openalex.org/W3114219454","https://openalex.org/W3099652303"],"abstract_inverted_index":{"In":[0],"this":[1,91],"paper,":[2],"we":[3,31,49],"propose":[4],"to":[5,37,105],"study":[6],"language":[7,34,55,86],"modelling":[8],"as":[9,57],"a":[10,72],"multi-task":[11,41,73],"problem,":[12],"bringing":[13],"together":[14],"three":[15,111],"strands":[16],"of":[17,40,54,63,80,85],"research:":[18],"multitask":[19,96],"learning,":[20,97],"linguistics,":[21],"and":[22,99,102],"interpretability.":[23],"Based":[24],"on":[25],"hypotheses":[26],"derived":[27],"from":[28],"linguistic":[29,61],"theory,":[30],"investigate":[32],"whether":[33],"models":[35,56],"adhere":[36],"learning":[38,42],"principles":[39],"during":[43],"training.":[44],"To":[45],"showcase":[46],"the":[47,51,60,78,81],"idea,":[48],"analyse":[50],"generalisation":[52],"behaviour":[53],"they":[58],"learn":[59],"concept":[62],"Negative":[64],"Polarity":[65],"Items":[66],"(NPIs).":[67],"Our":[68],"experiments":[69],"demonstrate":[70],"that":[71,90],"setting":[74],"naturally":[75],"emerges":[76],"within":[77],"objective":[79],"more":[82],"general":[83],"task":[84],"modelling.":[87],"We":[88],"argue":[89],"insight":[92],"is":[93],"valuable":[94],"for":[95],"linguistics":[98],"interpretability":[100],"research":[101],"can":[103],"lead":[104],"exciting":[106],"new":[107],"findings":[108],"in":[109],"all":[110],"domains.":[112]},"counts_by_year":[],"updated_date":"2026-03-17T17:19:04.345684","created_date":"2025-10-10T00:00:00"}
