{"id":"https://openalex.org/W3012804686","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207139","title":"Learned Weight Sharing for Deep Multi-Task Learning by Natural Evolution Strategy and Stochastic Gradient Descent","display_name":"Learned Weight Sharing for Deep Multi-Task Learning by Natural Evolution Strategy and Stochastic Gradient Descent","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3012804686","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207139","mag":"3012804686"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9207139","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207139","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2003.10159","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001694973","display_name":"Jonas Prellberg","orcid":null},"institutions":[{"id":"https://openalex.org/I129877168","display_name":"Carl von Ossietzky Universit\u00e4t Oldenburg","ror":"https://ror.org/033n9gh91","country_code":"DE","type":"education","lineage":["https://openalex.org/I129877168"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Jonas Prellberg","raw_affiliation_strings":["Dept. of Computer Science, University of Oldenburg, Oldenburg, Germany","Univ. of Oldenburg"],"affiliations":[{"raw_affiliation_string":"Dept. of Computer Science, University of Oldenburg, Oldenburg, Germany","institution_ids":["https://openalex.org/I129877168"]},{"raw_affiliation_string":"Univ. of Oldenburg","institution_ids":["https://openalex.org/I129877168"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103020462","display_name":"Oliver Kr\u00e4mer","orcid":"https://orcid.org/0000-0001-7607-1700"},"institutions":[{"id":"https://openalex.org/I129877168","display_name":"Carl von Ossietzky Universit\u00e4t Oldenburg","ror":"https://ror.org/033n9gh91","country_code":"DE","type":"education","lineage":["https://openalex.org/I129877168"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Oliver Kramer","raw_affiliation_strings":["Dept. of Computer Science, University of Oldenburg, Oldenburg, Germany","Univ. of Oldenburg"],"affiliations":[{"raw_affiliation_string":"Dept. of Computer Science, University of Oldenburg, Oldenburg, Germany","institution_ids":["https://openalex.org/I129877168"]},{"raw_affiliation_string":"Univ. of Oldenburg","institution_ids":["https://openalex.org/I129877168"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001694973"],"corresponding_institution_ids":["https://openalex.org/I129877168"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0287763,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7550127506256104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7393632531166077},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6797980070114136},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.634458601474762},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6229813694953918},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5821270942687988},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.5736328959465027},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5478271842002869},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4878073036670685},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.4525175094604492},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4477861821651459},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.26478031277656555},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12629660964012146}],"concepts":[{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7550127506256104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7393632531166077},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6797980070114136},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.634458601474762},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6229813694953918},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5821270942687988},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.5736328959465027},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5478271842002869},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4878073036670685},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.4525175094604492},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4477861821651459},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26478031277656555},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12629660964012146},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9207139","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207139","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2003.10159","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2003.10159","pdf_url":"https://arxiv.org/pdf/2003.10159","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3012804686","is_oa":true,"landing_page_url":"http://arxiv.org/pdf/2003.10159.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2003.10159","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2003.10159","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2003.10159","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2003.10159","pdf_url":"https://arxiv.org/pdf/2003.10159","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3012804686.pdf","grobid_xml":"https://content.openalex.org/works/W3012804686.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1677182931","https://openalex.org/W1896424170","https://openalex.org/W2142508340","https://openalex.org/W2149933564","https://openalex.org/W2151965738","https://openalex.org/W2194321275","https://openalex.org/W2194775991","https://openalex.org/W2295072214","https://openalex.org/W2549401308","https://openalex.org/W2577183329","https://openalex.org/W2583761661","https://openalex.org/W2617039999","https://openalex.org/W2734358244","https://openalex.org/W2902986194","https://openalex.org/W2913340405","https://openalex.org/W2945445935","https://openalex.org/W2948894819","https://openalex.org/W2963393838","https://openalex.org/W2963704251","https://openalex.org/W2963877604","https://openalex.org/W2964118262","https://openalex.org/W2964121744","https://openalex.org/W6628707872","https://openalex.org/W6631190155","https://openalex.org/W6682132143","https://openalex.org/W6682262322","https://openalex.org/W6704665273","https://openalex.org/W6732467815","https://openalex.org/W6732735668","https://openalex.org/W6738491513","https://openalex.org/W6745240403","https://openalex.org/W6745642626","https://openalex.org/W6763197128","https://openalex.org/W6763325255"],"related_works":["https://openalex.org/W3091077821","https://openalex.org/W3101155878","https://openalex.org/W2915446515","https://openalex.org/W2989826725","https://openalex.org/W3006531612","https://openalex.org/W3129958428","https://openalex.org/W3033503043","https://openalex.org/W2149464712","https://openalex.org/W3080901109","https://openalex.org/W2951941802","https://openalex.org/W3162492846","https://openalex.org/W3036917029","https://openalex.org/W2437447943","https://openalex.org/W3028262105","https://openalex.org/W2735995851","https://openalex.org/W2294805292","https://openalex.org/W2998093422","https://openalex.org/W2466795","https://openalex.org/W3101654339","https://openalex.org/W3042303144"],"abstract_inverted_index":{"In":[0,42],"deep":[1],"multi-task":[2,123],"learning,":[3],"weights":[4,23,65,105],"of":[5,64,89],"task-specific":[6,40,67,101],"networks":[7,102],"are":[8,100],"shared":[9,62],"between":[10,26,60],"tasks":[11],"to":[12,24,30,56],"improve":[13],"performance":[14],"on":[15,121],"each":[16],"single":[17],"one.":[18],"Since":[19],"the":[20,58,71,76,80],"question,":[21],"which":[22],"share":[25,35,104],"layers,":[27],"is":[28],"difficult":[29],"answer,":[31],"human-designed":[32],"architectures":[33],"often":[34],"everything":[36],"but":[37,106],"a":[38,61,87],"last":[39],"layer.":[41],"many":[43],"cases,":[44],"this":[45],"simplistic":[46],"approach":[47],"severely":[48],"limits":[49],"performance.":[50],"Instead,":[51],"we":[52],"propose":[53],"an":[54],"algorithm":[55],"learn":[57],"assignment":[59,73],"set":[63],"and":[66,74,93,117],"layers.":[68],"To":[69],"optimize":[70],"non-differentiable":[72],"at":[75],"same":[77],"time":[78],"train":[79],"differentiable":[81],"weights,":[82],"learning":[83,124],"takes":[84],"place":[85],"via":[86],"combination":[88],"natural":[90],"evolution":[91],"strategy":[92],"stochastic":[94],"gradient":[95],"descent.":[96],"The":[97],"end":[98],"result":[99],"that":[103],"allow":[107],"independent":[108],"inference.":[109],"They":[110],"achieve":[111],"lower":[112],"test":[113],"errors":[114],"than":[115],"baselines":[116],"methods":[118],"from":[119],"literature":[120],"three":[122],"datasets.":[125]},"counts_by_year":[],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
