{"id":"https://openalex.org/W3199446656","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534452","title":"Bridging the Gap of Dimensions in Distillation: Understanding the knowledge transfer between different-dimensional semantic spaces","display_name":"Bridging the Gap of Dimensions in Distillation: Understanding the knowledge transfer between different-dimensional semantic spaces","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3199446656","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534452","mag":"3199446656"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9534452","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534452","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100622932","display_name":"Zhiyuan Ma","orcid":"https://orcid.org/0000-0003-2153-5824"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyuan Ma","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001006462","display_name":"Ziyue Song","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyue Song","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025780527","display_name":"Haodong Zhao","orcid":"https://orcid.org/0000-0002-4405-1649"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haodong Zhao","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004609196","display_name":"Kui Meng","orcid":"https://orcid.org/0000-0001-9443-9716"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kui Meng","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085695760","display_name":"Gongshen Liu","orcid":"https://orcid.org/0000-0001-5194-1570"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gongshen Liu","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100622932"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.136,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.55024907,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"80","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6598008871078491},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5303307771682739},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5036515593528748},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.49738839268684387},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.47594761848449707},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.45406267046928406},{"id":"https://openalex.org/keywords/semantic-space","display_name":"Semantic space","score":0.44016772508621216},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.4375995695590973},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.4347439110279083},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4258372187614441},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.42496681213378906},{"id":"https://openalex.org/keywords/euclidean-space","display_name":"Euclidean space","score":0.41499632596969604},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4127427935600281},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3666486144065857},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18234971165657043}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6598008871078491},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5303307771682739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5036515593528748},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.49738839268684387},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.47594761848449707},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.45406267046928406},{"id":"https://openalex.org/C2986420190","wikidata":"https://www.wikidata.org/wiki/Q39045939","display_name":"Semantic space","level":2,"score":0.44016772508621216},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.4375995695590973},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.4347439110279083},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4258372187614441},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.42496681213378906},{"id":"https://openalex.org/C186450821","wikidata":"https://www.wikidata.org/wiki/Q17295","display_name":"Euclidean space","level":2,"score":0.41499632596969604},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4127427935600281},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3666486144065857},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18234971165657043},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9534452","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534452","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G2863268074","display_name":null,"funder_award_id":"61772337,U1736207","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1591801644","https://openalex.org/W1690739335","https://openalex.org/W1724438581","https://openalex.org/W1821462560","https://openalex.org/W1832693441","https://openalex.org/W1902237438","https://openalex.org/W2014902591","https://openalex.org/W2070246124","https://openalex.org/W2114524997","https://openalex.org/W2160660844","https://openalex.org/W2163455955","https://openalex.org/W2251939518","https://openalex.org/W2561238782","https://openalex.org/W2739879705","https://openalex.org/W2741613777","https://openalex.org/W2803023299","https://openalex.org/W2904759072","https://openalex.org/W2962965870","https://openalex.org/W2963350559","https://openalex.org/W2963403868","https://openalex.org/W2963736842","https://openalex.org/W2963982496","https://openalex.org/W2964118293","https://openalex.org/W2964121744","https://openalex.org/W2964222566","https://openalex.org/W2995607862","https://openalex.org/W3091643389","https://openalex.org/W3105966348","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6635446068","https://openalex.org/W6637551013","https://openalex.org/W6637709462","https://openalex.org/W6638523607","https://openalex.org/W6691459498","https://openalex.org/W6718212895","https://openalex.org/W6726275242","https://openalex.org/W6730179637","https://openalex.org/W6739901393","https://openalex.org/W6751751081","https://openalex.org/W6757123339","https://openalex.org/W6768086466","https://openalex.org/W6769906912"],"related_works":["https://openalex.org/W2905433371","https://openalex.org/W4361193272","https://openalex.org/W4310278675","https://openalex.org/W2806259446","https://openalex.org/W2963326959","https://openalex.org/W4312407344","https://openalex.org/W4384115502","https://openalex.org/W4226258012","https://openalex.org/W4383681494","https://openalex.org/W2128807628"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"knowledge":[3,34,37,186],"distillation":[4,38,115],"has":[5],"been":[6],"widely":[7],"used":[8],"in":[9,15,67,108,173,206],"the":[10,19,42,46,58,68,72,79,93,97,105,131,138,142,149,158,170,182,200],"field":[11],"of":[12,49,71,85,96,104,137,151,184,202],"deep":[13],"learning":[14],"order":[16],"to":[17,40,117,123,129,134,169],"reduce":[18],"model":[20,87,205],"size":[21],"and":[22,25,36,52,145],"save":[23],"time":[24],"space.":[26,175],"The":[27],"student-teacher":[28,189],"paradigm":[29],"is":[30,100,166],"a":[31,50,86,126,135,178,203],"framework":[32],"for":[33,76,181,188],"distillation,":[35],"proposed":[39],"minimize":[41],"KL":[43],"divergence":[44],"between":[45],"probabilistic":[47,59],"outputs":[48],"teacher":[51,73,106],"student":[53,98],"network.":[54,74],"However,":[55],"apart":[56],"from":[57,82,102],"outputs,":[60],"there":[61],"are":[62],"much":[63],"valuable":[64],"information":[65],"contained":[66],"middle":[69],"layers":[70,84],"As":[75],"NLP":[77],"tasks,":[78],"hidden":[80,113],"vectors":[81],"different":[83,89,101,207,210],"have":[88],"semantic":[90,163],"information,":[91,164],"but":[92],"vectors'":[94],"dimension":[95,140],"network":[99,107],"that":[103,194],"many":[109],"cases,":[110],"which":[111,165],"makes":[112],"layer":[114],"hard":[116],"be":[118],"performed":[119],"directly.":[120],"We":[121,176],"propose":[122],"simply":[124],"use":[125],"transition":[127,159],"matrix":[128,160],"project":[130],"student's":[132],"vector":[133],"space":[136,187],"same":[139],"as":[141],"teacher's":[143],"vector,":[144],"we":[146],"theoretically":[147],"prove":[148],"effectiveness":[150],"this":[152,195],"method.":[153],"Our":[154,191],"analysis":[155],"shows":[156],"how":[157],"preserve":[161],"important":[162],"closely":[167],"related":[168],"vector's":[171],"characteristic":[172],"Euclidean":[174],"provide":[177],"geometric":[179],"method":[180,196],"interpretability":[183],"shared":[185],"architectures.":[190],"experiments":[192],"show":[193],"can":[197],"significantly":[198],"improve":[199],"performance":[201],"small":[204],"tasks":[208],"with":[209],"models.":[211]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
