{"id":"https://openalex.org/W4409325826","doi":"https://doi.org/10.1109/tcss.2025.3555653","title":"Modality-Disentangled Feature Extraction via Knowledge Distillation in Multimodal Recommendation Systems","display_name":"Modality-Disentangled Feature Extraction via Knowledge Distillation in Multimodal Recommendation Systems","publication_year":2025,"publication_date":"2025-04-10","ids":{"openalex":"https://openalex.org/W4409325826","doi":"https://doi.org/10.1109/tcss.2025.3555653"},"language":"en","primary_location":{"id":"doi:10.1109/tcss.2025.3555653","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcss.2025.3555653","pdf_url":null,"source":{"id":"https://openalex.org/S2490693980","display_name":"IEEE Transactions on Computational Social Systems","issn_l":"2329-924X","issn":["2329-924X","2373-7476"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Social Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077588477","display_name":"Haibing Hu","orcid":"https://orcid.org/0000-0003-1207-4472"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haibing Hu","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108133841","display_name":"Yuehong Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210146919","display_name":"Shanghai Industrial Technology Institute","ror":"https://ror.org/03j1pdd39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210146919"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yangyi Xie","raw_affiliation_strings":["Industrial Field, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Industrial Field, Shanghai, China","institution_ids":["https://openalex.org/I4210146919"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085254654","display_name":"Defu Lian","orcid":"https://orcid.org/0000-0002-3507-9607"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Defu Lian","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084367706","display_name":"Kai Han","orcid":"https://orcid.org/0000-0002-6302-5366"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Han","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, China","institution_ids":["https://openalex.org/I3923682"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5077588477"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03490849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":"6","first_page":"4517","last_page":"4531"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9753999710083008,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.6641598343849182},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6593331694602966},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6241051554679871},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.601134717464447},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.5307213068008423},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.48093101382255554},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.4621048867702484},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42308229207992554},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3691387176513672},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33260971307754517},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33126550912857056},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.09853300452232361},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.08470165729522705}],"concepts":[{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.6641598343849182},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6593331694602966},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6241051554679871},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.601134717464447},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.5307213068008423},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.48093101382255554},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.4621048867702484},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42308229207992554},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3691387176513672},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33260971307754517},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33126550912857056},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.09853300452232361},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.08470165729522705},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcss.2025.3555653","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcss.2025.3555653","pdf_url":null,"source":{"id":"https://openalex.org/S2490693980","display_name":"IEEE Transactions on Computational Social Systems","issn_l":"2329-924X","issn":["2329-924X","2373-7476"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computational Social Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1949478088","https://openalex.org/W1964073652","https://openalex.org/W2027731328","https://openalex.org/W2028988057","https://openalex.org/W2061212083","https://openalex.org/W2061873838","https://openalex.org/W2069682406","https://openalex.org/W2509893387","https://openalex.org/W2604433096","https://openalex.org/W2605350416","https://openalex.org/W2767724106","https://openalex.org/W2798713837","https://openalex.org/W2807722546","https://openalex.org/W2808847742","https://openalex.org/W2945827670","https://openalex.org/W2963655167","https://openalex.org/W2963871344","https://openalex.org/W2963890275","https://openalex.org/W2964258748","https://openalex.org/W2969960436","https://openalex.org/W2970231061","https://openalex.org/W2982108874","https://openalex.org/W3044311607","https://openalex.org/W3045200674","https://openalex.org/W3090865871","https://openalex.org/W3093002391","https://openalex.org/W3093502611","https://openalex.org/W3100652389","https://openalex.org/W3106867121","https://openalex.org/W4224326485","https://openalex.org/W4225308835","https://openalex.org/W4226048133","https://openalex.org/W4322718576","https://openalex.org/W4361230837","https://openalex.org/W4376132596","https://openalex.org/W4377715604","https://openalex.org/W4388187692","https://openalex.org/W4389934670","https://openalex.org/W4390908079","https://openalex.org/W4392083355","https://openalex.org/W4393405236","https://openalex.org/W4395027812","https://openalex.org/W4400078320","https://openalex.org/W4400228958","https://openalex.org/W4401090676","https://openalex.org/W4403933898","https://openalex.org/W4404244857","https://openalex.org/W4405838414"],"related_works":["https://openalex.org/W2385859805","https://openalex.org/W2530972254","https://openalex.org/W2374013449","https://openalex.org/W73545470","https://openalex.org/W2364381299","https://openalex.org/W2374430585","https://openalex.org/W3144423903","https://openalex.org/W2377397762","https://openalex.org/W2793967660","https://openalex.org/W2361654993"],"abstract_inverted_index":{"Multimodal":[0,45],"recommendation":[1,6,46,91,124,179,406],"enhances":[2,252],"item":[3,13,23,36],"representation":[4,37,75,218],"in":[5,89,118,151,177,307,314,451],"systems":[7,57],"by":[8,95],"integrating":[9,141],"diverse":[10],"modalities":[11],"of":[12,35,43,56,70,76,84,102,135,282,304,366,381,390,398,429,461],"information":[14,142,312,346,357,376],"beyond":[15],"traditional":[16],"ID-based":[17],"features.":[18,260],"This":[19,249,298,393],"approach":[20,65,202],"utilizes":[21],"supplementary":[22],"details,":[24],"including":[25],"images,":[26],"text,":[27],"videos,":[28],"and":[29,38,73,222,234,287,310,324,344,351,358,377,438],"audio,":[30],"to":[31,66,127,183,216,242,257,270,318,417,457],"refine":[32],"the":[33,41,54,68,74,81,87,100,147,185,253,262,265,271,289,295,302,322,348,364,371,379,388,396,405,410,426],"accuracy":[34],"thereby":[39,79],"boost":[40],"precision":[42],"recommendations.":[44,85],"has":[47,138],"emerged":[48],"as":[49,239],"a":[50,63,132,159,204,283,332,419,448,459],"vibrant":[51],"field":[52],"within":[53],"scope":[55],"that":[58,188],"generate":[59],"suggestions.":[60],"It":[61],"offers":[62],"powerful":[64],"address":[67],"challenges":[69],"data":[71,120,305],"scarcity":[72],"long-tail":[77],"content,":[78],"improving":[80],"overall":[82],"quality":[83],"However,":[86],"advancement":[88],"multimodal":[90,104,178,192,259],"is":[92,227,268],"currently":[93],"hindered":[94],"two":[96],"main":[97],"obstacles.":[98],"First,":[99,182],"process":[101,250],"extracting":[103,191],"features":[105,193,326],"from":[106,220,264,347],"pre-trained":[107],"models":[108],"using":[109],"either":[110,195],"shallow":[111,198,284,315],"or":[112,122,197],"deep":[113,196,211,308],"neural":[114,199,212,285],"networks":[115,213,309,350],"often":[116,145],"results":[117,445],"insufficient":[119,311],"extraction":[121,313],"sparse":[123],"data,":[125],"leading":[126],"suboptimal":[128],"model":[129],"performance.":[130],"Second,":[131,317],"significant":[133,449],"portion":[134],"previous":[136],"research":[137],"focused":[139],"on":[140,294,440],"across":[143],"modalities,":[144,329],"overlooking":[146],"distinct":[148,325],"characteristics":[149],"inherent":[150],"different":[152,328],"modalities.":[153],"Addressing":[154],"these":[155],"challenges,":[156],"we":[157,292,330,369,403,414,433],"introduce":[158],"unique":[160],"methodology":[161],"titled":[162],"\u201c<underline":[163],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[164,166,170,175],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">mo</u>dality-<underline":[165],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">d</u>isentangled":[167],"feature":[168,400],"<underline":[169],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">e</u>xtraction":[171],"via":[172,231],"knowledge":[173,263,275],"di<underline":[174],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">st</u>illation":[176],"systems\u201d":[180],"(MODEST).":[181],"tackle":[184],"aforementioned":[186],"problems":[187],"arise":[189],"when":[190],"with":[194,387,409],"networks,":[200],"our":[201,430,452],"adopts":[203],"teacher\u2013student":[205,349],"network":[206,267,273,279],"framework.":[207],"In":[208],"this":[209],"framework,":[210],"are":[214,237],"utilized":[215],"extract":[217,258],"vectors":[219],"text":[221,343],"image":[223,345],"data.":[224],"Feature":[225],"fusion":[226],"then":[228],"carried":[229],"out":[230],"attention":[232],"mechanisms,":[233],"semantic":[235],"labels":[236,241],"employed":[238],"classification":[240],"derive":[243],"three":[244],"supervised":[245],"learning":[246],"loss":[247,407,412],"functions.":[248],"significantly":[251],"teacher":[254,266],"network\u2019s":[255],"capacity":[256],"Subsequently,":[261],"transferred":[269],"student":[272,278,296],"through":[274],"distillation.":[276],"The":[277,444],"makes":[280],"use":[281],"network,":[286],"during":[288],"inference":[290],"stage,":[291],"rely":[293],"network.":[297],"strategy":[299],"effectively":[300,320,394],"resolves":[301],"issues":[303],"sparsity":[306],"networks.":[316],"more":[319],"capture":[321],"similarities":[323],"among":[327],"implement":[331],"disentangled":[333],"modality":[334],"decomposition":[335],"technique.":[336],"Through":[337],"integrated":[338],"mappings,":[339],"it":[340,456],"separately":[341],"extracts":[342],"decomposes":[352],"them":[353],"into":[354],"cross-modality":[355,359,374,382,399],"common":[356,375],"specific":[360,383],"information.":[361],"By":[362],"applying":[363],"constraints":[365,413],"contrastive":[367],"learning,":[368],"minimize":[370],"distance":[372],"between":[373],"maximize":[378],"separation":[380],"information,":[384],"promoting":[385],"convergence":[386],"aid":[389],"auxiliary":[391],"loss.":[392],"addresses":[395],"problem":[397],"alignment.":[401],"Lastly,":[402],"combine":[404],"function":[408],"multiple":[411],"have":[415,434],"added":[416],"formulate":[418],"unified":[420],"optimization":[421],"objective":[422],"function.":[423],"To":[424],"underscore":[425],"remarkable":[427],"efficacy":[428],"proposed":[431],"model,":[432],"executed":[435],"comprehensive":[436],"experiments":[437],"visualizations":[439],"several":[441],"real-world":[442],"datasets.":[443],"distinctly":[446],"show":[447],"enhancement":[450],"model\u2019s":[453],"performance,":[454],"allowing":[455],"achieve":[458],"level":[460],"competitiveness":[462],"against":[463],"other":[464],"methods.":[465]},"counts_by_year":[],"updated_date":"2025-12-03T23:09:05.601824","created_date":"2025-10-10T00:00:00"}
