{"id":"https://openalex.org/W2900533563","doi":"https://doi.org/10.1609/aaai.v33i01.33016949","title":"A Hierarchical Multi-Task Approach for Learning Embeddings from Semantic Tasks","display_name":"A Hierarchical Multi-Task Approach for Learning Embeddings from Semantic Tasks","publication_year":2019,"publication_date":"2019-07-17","ids":{"openalex":"https://openalex.org/W2900533563","doi":"https://doi.org/10.1609/aaai.v33i01.33016949","mag":"2900533563"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v33i01.33016949","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33016949","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4673/4551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4673/4551","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049805631","display_name":"Victor Sanh","orcid":null},"institutions":[{"id":"https://openalex.org/I4387154989","display_name":"Hugging Face","ror":"https://ror.org/02grspc61","country_code":null,"type":"company","lineage":["https://openalex.org/I4387154989"]},{"id":"https://openalex.org/I4210136376","display_name":"FACE Foundation","ror":"https://ror.org/04121g745","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210136376"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Victor Sanh","raw_affiliation_strings":["Hugging Face"],"affiliations":[{"raw_affiliation_string":"Hugging Face","institution_ids":["https://openalex.org/I4210136376","https://openalex.org/I4387154989"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107899645","display_name":"Thomas Wolf","orcid":null},"institutions":[{"id":"https://openalex.org/I4387154989","display_name":"Hugging Face","ror":"https://ror.org/02grspc61","country_code":null,"type":"company","lineage":["https://openalex.org/I4387154989"]},{"id":"https://openalex.org/I4210136376","display_name":"FACE Foundation","ror":"https://ror.org/04121g745","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210136376"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas Wolf","raw_affiliation_strings":["Hugging Face"],"affiliations":[{"raw_affiliation_string":"Hugging Face","institution_ids":["https://openalex.org/I4210136376","https://openalex.org/I4387154989"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037310413","display_name":"Sebastian Ruder","orcid":null},"institutions":[{"id":"https://openalex.org/I181231927","display_name":"National University of Ireland","ror":"https://ror.org/00shsf120","country_code":"IE","type":"education","lineage":["https://openalex.org/I181231927"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Sebastian Ruder","raw_affiliation_strings":["National University of Ireland","National University of Ireland,"],"affiliations":[{"raw_affiliation_string":"National University of Ireland","institution_ids":["https://openalex.org/I181231927"]},{"raw_affiliation_string":"National University of Ireland,","institution_ids":["https://openalex.org/I181231927"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049805631"],"corresponding_institution_ids":["https://openalex.org/I4210136376","https://openalex.org/I4387154989"],"apc_list":null,"apc_paid":null,"fwci":3.9979,"has_fulltext":true,"cited_by_count":35,"citation_normalized_percentile":{"value":0.94244726,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"33","issue":"01","first_page":"6949","last_page":"6956"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8620301485061646},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7619448900222778},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6512430906295776},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6463404893875122},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6423467993736267},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.5999428033828735},{"id":"https://openalex.org/keywords/hierarchical-database-model","display_name":"Hierarchical database model","score":0.49138155579566956},{"id":"https://openalex.org/keywords/top-down-and-bottom-up-design","display_name":"Top-down and bottom-up design","score":0.44515782594680786},{"id":"https://openalex.org/keywords/relationship-extraction","display_name":"Relationship extraction","score":0.4359495937824249},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.4286845922470093},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33515894412994385},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.30415916442871094},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.24233028292655945},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.10042741894721985}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8620301485061646},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7619448900222778},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6512430906295776},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6463404893875122},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6423467993736267},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.5999428033828735},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.49138155579566956},{"id":"https://openalex.org/C135798126","wikidata":"https://www.wikidata.org/wiki/Q2167279","display_name":"Top-down and bottom-up design","level":2,"score":0.44515782594680786},{"id":"https://openalex.org/C153604712","wikidata":"https://www.wikidata.org/wiki/Q7310755","display_name":"Relationship extraction","level":3,"score":0.4359495937824249},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.4286845922470093},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33515894412994385},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.30415916442871094},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.24233028292655945},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.10042741894721985},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1609/aaai.v33i01.33016949","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33016949","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4673/4551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1811.06031","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1811.06031","pdf_url":"https://arxiv.org/pdf/1811.06031","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.1811.06031","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1811.06031","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2900533563","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"doi:10.1609/aaai.v33i01.33016949","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33016949","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4673/4551","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8100000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2900533563.pdf","grobid_xml":"https://content.openalex.org/works/W2900533563.grobid-xml"},"referenced_works_count":59,"referenced_works":["https://openalex.org/W36434594","https://openalex.org/W1614862348","https://openalex.org/W1899794420","https://openalex.org/W2060277733","https://openalex.org/W2077054525","https://openalex.org/W2103076621","https://openalex.org/W2124700572","https://openalex.org/W2134033474","https://openalex.org/W2147880316","https://openalex.org/W2155069789","https://openalex.org/W2155247542","https://openalex.org/W2179519966","https://openalex.org/W2229639163","https://openalex.org/W2250539671","https://openalex.org/W2251035762","https://openalex.org/W2252031764","https://openalex.org/W2293004735","https://openalex.org/W2296073425","https://openalex.org/W2296283641","https://openalex.org/W2407338347","https://openalex.org/W2516255829","https://openalex.org/W2556468274","https://openalex.org/W2592170186","https://openalex.org/W2610858497","https://openalex.org/W2612953412","https://openalex.org/W2624871570","https://openalex.org/W2738152205","https://openalex.org/W2740462959","https://openalex.org/W2740663516","https://openalex.org/W2741956709","https://openalex.org/W2752172973","https://openalex.org/W2784231336","https://openalex.org/W2786685006","https://openalex.org/W2787560479","https://openalex.org/W2788528628","https://openalex.org/W2797498228","https://openalex.org/W2799124508","https://openalex.org/W2799125718","https://openalex.org/W2809324505","https://openalex.org/W2913340405","https://openalex.org/W2949563612","https://openalex.org/W2950726992","https://openalex.org/W2963140597","https://openalex.org/W2963918774","https://openalex.org/W2963925965","https://openalex.org/W2964094426","https://openalex.org/W3209042722","https://openalex.org/W6601502966","https://openalex.org/W6629028937","https://openalex.org/W6682939441","https://openalex.org/W6685810106","https://openalex.org/W6691431627","https://openalex.org/W6696904280","https://openalex.org/W6697155078","https://openalex.org/W6698204877","https://openalex.org/W6729596854","https://openalex.org/W6748634344","https://openalex.org/W6759193872","https://openalex.org/W6834922076"],"related_works":["https://openalex.org/W2963168538","https://openalex.org/W2963341956","https://openalex.org/W2250539671","https://openalex.org/W2897171319","https://openalex.org/W2786685006","https://openalex.org/W48813473","https://openalex.org/W1975759955","https://openalex.org/W2006710607","https://openalex.org/W2905190525","https://openalex.org/W3105747907","https://openalex.org/W168804263","https://openalex.org/W2251013762","https://openalex.org/W3198439322","https://openalex.org/W2799256867","https://openalex.org/W2556984224","https://openalex.org/W3167926051","https://openalex.org/W2895466885","https://openalex.org/W2964330417","https://openalex.org/W2976395280","https://openalex.org/W3184218698"],"abstract_inverted_index":{"Much":[0],"effort":[1],"has":[2,44],"been":[3],"devoted":[4],"to":[5,13,78,165,179],"evaluate":[6],"whether":[7],"multi-task":[8,42,59],"learning":[9,43,60],"can":[10,18],"be":[11,19],"leveraged":[12],"learn":[14],"rich":[15],"representations":[16,149],"that":[17,158],"used":[20],"in":[21,40,57,74],"various":[22],"Natural":[23],"Language":[24],"Processing":[25],"(NLP)":[26],"down-stream":[27],"applications.":[28],"However,":[29],"there":[30],"is":[31,72],"still":[32],"a":[33,45,53,58,63,75,85,115,144],"lack":[34],"of":[35,37,65,87,95,106,117,146,153,169,175],"understanding":[36],"the":[38,92,96,103,107,154,163,166,170,172,176],"settings":[39],"which":[41],"significant":[46],"effect.":[47],"In":[48],"this":[49],"work,":[50],"we":[51,160],"introduce":[52,79],"hierarchical":[54,76,140],"model":[55,71,97,110],"trained":[56,73],"setup":[61],"on":[62,114],"set":[64,86,145],"carefully":[66],"selected":[67],"semantic":[68,148,183],"tasks.":[69],"The":[70,139],"fashion":[77],"an":[80],"inductive":[81],"bias":[82],"by":[83],"supervising":[84],"low":[88],"level":[89],"tasks":[90,101],"at":[91,102,150],"bottom":[93,164],"layers":[94,105,152,168,177],"and":[98,126],"more":[99,181],"complex":[100,182],"top":[104,167],"model.":[108,155],"This":[109],"achieves":[111],"state-of-the-art":[112],"results":[113],"number":[116],"tasks,":[118],"namely":[119],"Named":[120],"Entity":[121,123],"Recognition,":[122],"Mention":[124],"Detection":[125],"Relation":[127],"Extraction":[128],"without":[129],"hand-engineered":[130],"features":[131],"or":[132],"external":[133],"NLP":[134],"tools":[135],"like":[136],"syntactic":[137],"parsers.":[138],"training":[141],"supervision":[142],"induces":[143],"shared":[147],"lower":[151],"We":[156],"show":[157],"as":[159],"move":[161],"from":[162],"model,":[171],"hidden":[173],"states":[174],"tend":[178],"represent":[180],"information.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":10}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
