{"id":"https://openalex.org/W4385567541","doi":"https://doi.org/10.1145/3580305.3599301","title":"Deep Encoders with Auxiliary Parameters for Extreme Classification","display_name":"Deep Encoders with Auxiliary Parameters for Extreme Classification","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385567541","doi":"https://doi.org/10.1145/3580305.3599301"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599301","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599301","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081553743","display_name":"Kunal Dahiya","orcid":"https://orcid.org/0000-0002-1500-0295"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Kunal Dahiya","raw_affiliation_strings":["IIT Delhi, New Delhi, India"],"affiliations":[{"raw_affiliation_string":"IIT Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101941000","display_name":"Sachin Yadav","orcid":"https://orcid.org/0000-0003-0048-1118"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sachin Yadav","raw_affiliation_strings":["Microsoft Research, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103258794","display_name":"S. L. Sondhi","orcid":"https://orcid.org/0009-0007-8146-2854"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sushant Sondhi","raw_affiliation_strings":["IIT Delhi, New Delhi, India"],"affiliations":[{"raw_affiliation_string":"IIT Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059937402","display_name":"Deepak Saini","orcid":"https://orcid.org/0000-0002-6057-4351"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Deepak Saini","raw_affiliation_strings":["Microsoft, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Bellevue, WA, USA","institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I4210108985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004409285","display_name":"Sonu Mehta","orcid":"https://orcid.org/0000-0003-1654-3766"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]},{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sonu Mehta","raw_affiliation_strings":["Microsoft Research &amp; IIT Delhi, Bangalore &amp; New Delhi, India"],"affiliations":[{"raw_affiliation_string":"Microsoft Research &amp; IIT Delhi, Bangalore &amp; New Delhi, India","institution_ids":["https://openalex.org/I4210124949","https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074199611","display_name":"Jian Jiao","orcid":"https://orcid.org/0000-0003-4779-9588"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]},{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jian Jiao","raw_affiliation_strings":["Microsoft, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Bellevue, WA, USA","institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I4210108985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001668151","display_name":"Sumeet Agarwal","orcid":"https://orcid.org/0000-0002-5714-3921"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sumeet Agarwal","raw_affiliation_strings":["IIT Delhi, New Delhi, India"],"affiliations":[{"raw_affiliation_string":"IIT Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081725635","display_name":"Purushottam Kar","orcid":"https://orcid.org/0000-0003-2096-5267"},"institutions":[{"id":"https://openalex.org/I94234084","display_name":"Indian Institute of Technology Kanpur","ror":"https://ror.org/05pjsgx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I94234084"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Purushottam Kar","raw_affiliation_strings":["IIT Kanpur, Kanpur, India"],"affiliations":[{"raw_affiliation_string":"IIT Kanpur, Kanpur, India","institution_ids":["https://openalex.org/I94234084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051880496","display_name":"Manik Varma","orcid":null},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manik Varma","raw_affiliation_strings":["Microsoft Research, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5081553743"],"corresponding_institution_ids":["https://openalex.org/I68891433"],"apc_list":null,"apc_paid":null,"fwci":0.8884,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.78986293,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"358","last_page":"367"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7875967025756836},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7706353664398193},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6912287473678589},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5944735407829285},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5917089581489563},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5477015376091003},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5304833054542542},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5162594318389893},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.48390111327171326},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.4838827848434448},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46488165855407715},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4470128118991852},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4189671277999878},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34069788455963135},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3266606628894806},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.07520940899848938},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07418179512023926},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.07060492038726807}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7875967025756836},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7706353664398193},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6912287473678589},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5944735407829285},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5917089581489563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5477015376091003},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5304833054542542},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5162594318389893},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.48390111327171326},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.4838827848434448},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46488165855407715},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4470128118991852},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4189671277999878},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34069788455963135},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3266606628894806},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.07520940899848938},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07418179512023926},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.07060492038726807},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599301","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599301","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1834987204","https://openalex.org/W1892593501","https://openalex.org/W2068074736","https://openalex.org/W2359108789","https://openalex.org/W2362855512","https://openalex.org/W2520348554","https://openalex.org/W2744136723","https://openalex.org/W2782759081","https://openalex.org/W2788125153","https://openalex.org/W2906963924","https://openalex.org/W2921113176","https://openalex.org/W2945456403","https://openalex.org/W2963469388","https://openalex.org/W2963502184","https://openalex.org/W2964240234","https://openalex.org/W2999508688","https://openalex.org/W3035524453","https://openalex.org/W3037422790","https://openalex.org/W3080802002","https://openalex.org/W3093655911","https://openalex.org/W3094444847","https://openalex.org/W3099700870","https://openalex.org/W3102124616","https://openalex.org/W3114079967","https://openalex.org/W3152616003","https://openalex.org/W3168875417","https://openalex.org/W3169488402","https://openalex.org/W3177232285","https://openalex.org/W4288728031","https://openalex.org/W4312697098","https://openalex.org/W6601944498","https://openalex.org/W6818795685"],"related_works":["https://openalex.org/W2669956259","https://openalex.org/W4287995534","https://openalex.org/W2998168123","https://openalex.org/W2939353110","https://openalex.org/W2897995864","https://openalex.org/W4380075502","https://openalex.org/W4327774331","https://openalex.org/W2292254049","https://openalex.org/W4287178339","https://openalex.org/W3165463024"],"abstract_inverted_index":{"The":[0,95,156],"task":[1],"of":[2,17,43,91],"annotating":[3],"a":[4,14,39,44,48,58,99],"data":[5,72],"point":[6],"with":[7,107,126],"labels":[8,18,129],"most":[9],"relevant":[10],"to":[11,21,61,82,124,136],"it":[12,165],"from":[13],"large":[15],"universe":[16],"is":[19,183],"referred":[20],"as":[22],"Extreme":[23],"Classification":[24],"(XC).":[25],"State-of-the-art":[26],"XC":[27,69,114,148],"methods":[28,149],"have":[29],"applications":[30],"in":[31,57,68,176],"ranking,":[32],"recommendation,":[33],"and":[34,36,47,74,119,130,138,152,162],"tagging":[35],"mostly":[37],"employ":[38],"combination":[40],"architecture":[41],"comprised":[42],"deep":[45,147],"encoder":[46,84,105,169],"high-capacity":[49],"classifier.":[50],"These":[51],"two":[52],"components":[53],"are":[54,134],"often":[55],"trained":[56],"modular":[59],"fashion":[60],"conserve":[62],"compute.":[63],"This":[64],"paper":[65,96,157],"shows":[66,163],"that":[67,103,133,164],"settings":[70],"where":[71],"paucity":[73],"semantic":[75],"gap":[76],"issues":[77],"abound,":[78],"this":[79],"can":[80,122],"lead":[81],"suboptimal":[83],"training":[85,106,170,174],"which":[86],"negatively":[87],"affects":[88],"the":[89,92,120],"performance":[90],"overall":[93],"architecture.":[94],"then":[97],"proposes":[98],"lightweight":[100],"alternative":[101],"DEXA":[102,111,160,182],"augments":[104],"auxiliary":[108],"parameters.":[109],"Incorporating":[110],"into":[112],"existing":[113,146,172],"architectures":[115],"requires":[116],"minimal":[117],"modifications":[118],"method":[121],"scale":[123],"datasets":[125],"40":[127],"million":[128],"offer":[131],"predictions":[132],"up":[135],"6%":[137],"15%":[139],"more":[140],"accurate":[141],"than":[142,171],"embeddings":[143],"offered":[144],"by":[145],"on":[150],"benchmark":[151],"proprietary":[153],"datasets,":[154],"respectively.":[155],"also":[158],"analyzes":[159],"theoretically":[161],"offers":[166],"provably":[167],"superior":[168],"Siamese":[173],"strategies":[175],"certain":[177],"realizable":[178],"settings.":[179],"Code":[180],"for":[181],"available":[184],"at":[185],"https://github.com/Extreme-classification/dexa.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
