{"id":"https://openalex.org/W7164806866","doi":"https://doi.org/10.1145/3805622.3810591","title":"CREAM: Collaborative Representation with Self-supervised Alignment for Multimedia Recommendation","display_name":"CREAM: Collaborative Representation with Self-supervised Alignment for Multimedia Recommendation","publication_year":2026,"publication_date":"2026-06-15","ids":{"openalex":"https://openalex.org/W7164806866","doi":"https://doi.org/10.1145/3805622.3810591"},"language":null,"primary_location":{"id":"doi:10.1145/3805622.3810591","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810591","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3805622.3810591","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5138661332","display_name":"Junhao Gao","orcid":"https://orcid.org/0009-0001-5567-1325"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junhao Gao","raw_affiliation_strings":["Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China"],"raw_orcid":"https://orcid.org/0009-0001-5567-1325","affiliations":[{"raw_affiliation_string":"Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100604018","display_name":"Chao Yang","orcid":"https://orcid.org/0000-0001-8774-8115"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Yang","raw_affiliation_strings":["Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China"],"raw_orcid":"https://orcid.org/0000-0001-8774-8115","affiliations":[{"raw_affiliation_string":"Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007360513","display_name":"Bin Jiang","orcid":"https://orcid.org/0000-0002-5840-9664"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Jiang","raw_affiliation_strings":["Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China"],"raw_orcid":"https://orcid.org/0000-0002-5840-9664","affiliations":[{"raw_affiliation_string":"Hunan University, College of Computer Science and Electronic Engineering, Changsha, Hunan, China","institution_ids":["https://openalex.org/I16609230"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.96149997,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"298","last_page":"307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.7853999733924866,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.7853999733924866,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.050200000405311584,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.026399999856948853,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interactivity","display_name":"Interactivity","score":0.722599983215332},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6341000199317932},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.49480000138282776},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.45879998803138733},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.44440001249313354},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.3763999938964844},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.3725999891757965},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.3483999967575073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8478999733924866},{"id":"https://openalex.org/C144430266","wikidata":"https://www.wikidata.org/wiki/Q839721","display_name":"Interactivity","level":2,"score":0.722599983215332},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6341000199317932},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.49480000138282776},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4796000123023987},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.45879998803138733},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.44440001249313354},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.421999990940094},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.3763999938964844},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.3725999891757965},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.34139999747276306},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.33239999413490295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32989999651908875},{"id":"https://openalex.org/C67712803","wikidata":"https://www.wikidata.org/wiki/Q7901853","display_name":"User modeling","level":3,"score":0.3151000142097473},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.31380000710487366},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2870999872684479},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C2780126544","wikidata":"https://www.wikidata.org/wiki/Q837900","display_name":"Hypermedia","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C2780617661","wikidata":"https://www.wikidata.org/wiki/Q541563","display_name":"Subcategory","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C21569690","wikidata":"https://www.wikidata.org/wiki/Q94702","display_name":"Collaborative filtering","level":3,"score":0.25}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3805622.3810591","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810591","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3805622.3810591","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810591","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6668546377","display_name":null,"funder_award_id":"62172156","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1804536132","https://openalex.org/W1888005072","https://openalex.org/W2027731328","https://openalex.org/W2512971201","https://openalex.org/W2614794251","https://openalex.org/W2742143754","https://openalex.org/W2807021761","https://openalex.org/W2913023375","https://openalex.org/W2945827670","https://openalex.org/W2962907114","https://openalex.org/W2963655167","https://openalex.org/W2964258748","https://openalex.org/W2982108874","https://openalex.org/W3035524453","https://openalex.org/W3035725276","https://openalex.org/W3045200674","https://openalex.org/W3094605801","https://openalex.org/W3192113933","https://openalex.org/W3211143493","https://openalex.org/W4224983022","https://openalex.org/W4226210383","https://openalex.org/W4285288414","https://openalex.org/W4309185982","https://openalex.org/W4321593910","https://openalex.org/W4322718576","https://openalex.org/W4385270524","https://openalex.org/W4385682046","https://openalex.org/W4385825460","https://openalex.org/W4386845623","https://openalex.org/W4390451911","https://openalex.org/W4393159797","https://openalex.org/W4402404329","https://openalex.org/W4403221702","https://openalex.org/W4403577865","https://openalex.org/W4409364924","https://openalex.org/W4409364994","https://openalex.org/W4409365290","https://openalex.org/W4411635449","https://openalex.org/W7129226449","https://openalex.org/W7133215288"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"works":[1],"in":[2],"multimedia":[3,10],"recommendation":[4],"combine":[5],"interaction":[6],"data":[7],"with":[8,110,151],"rich":[9],"content":[11],"to":[12,38,69,127],"generate":[13],"personalized":[14],"recommendations,":[15],"which":[16,43],"has":[17],"attracted":[18],"considerable":[19],"attention.":[20],"Despite":[21],"their":[22],"effectiveness,":[23],"the":[24,39,96,203],"existing":[25],"methods":[26],"still":[27],"suffer":[28],"from":[29,98],"three":[30,199],"limitations:":[31],"(1)":[32],"Incomplete":[33],"user":[34,129],"preference":[35],"modeling":[36,144],"due":[37],"late":[40,125],"fusion":[41,126],"strategy":[42],"ignores":[44],"modality":[45,49,76,86,137],"interactivity":[46,134],"and":[47,67,88,135,159,190],"user-specific":[48],"preference;":[50],"(2)":[51],"Insufficient":[52],"multimodal":[53],"item":[54],"representation":[55],"caused":[56],"by":[57],"conventional":[58],"homogeneous":[59],"graph":[60,150],"structure":[61],"that":[62,145,185],"faces":[63],"a":[64,106,120,147,152,167,181],"message-passing":[65,157],"bottleneck":[66],"struggles":[68],"capture":[70],"two-hop":[71,161],"node":[72,162],"similarity;":[73],"(3)":[74],"Ineffective":[75],"alignment":[77,94,169,184],"based":[78,170],"on":[79,171,198],"entity-specific":[80],"fine-grained":[81],"mutual":[82],"information":[83],"may":[84],"undermine":[85],"specificity":[87],"semantic":[89],"richness,":[90],"while":[91],"user-item":[92,182],"behavior":[93,183],"neglects":[95],"usefulness":[97],"negative":[99,191],"feedback.":[100],"To":[101],"this":[102],"end,":[103],"we":[104,118,140,165],"propose":[105,141,180],"novel":[107],"Collaborative":[108],"Representation":[109],"SElf-supervised":[111],"Alignment":[112],"for":[113,124],"Multimedia":[114],"Recommendation":[115],"(CREAM).":[116],"Specifically,":[117],"design":[119,166],"collaborative":[121],"attention":[122],"mechanism":[123],"model":[128],"preferences,":[130],"capturing":[131,160],"both":[132],"cross-modal":[133,176],"specific":[136],"preferences.":[138],"Secondly,":[139],"dual":[142],"graph-view":[143],"combines":[146],"traditional":[148],"pair-wise":[149],"derived":[153],"group-wise":[154],"hypergraph,":[155],"improving":[156],"efficiency":[158],"similarity.":[163],"Finally,":[164],"self-supervised":[168],"Cauchy-Schwarz":[172],"divergence,":[173],"achieving":[174],"coarse-grained":[175],"alignment.":[177],"We":[178],"also":[179],"explicitly":[186],"distinguishes":[187],"users\u2019":[188],"positive":[189],"preferences":[192],"through":[193],"contrastive":[194],"learning.":[195],"Extensive":[196],"experiments":[197],"public":[200],"datasets":[201],"demonstrate":[202],"effectiveness":[204],"of":[205],"CREAM.":[206],"Our":[207],"code":[208],"is":[209],"available":[210],"at":[211],"https://github.com/GarethJellingham/CREAM.":[212]},"counts_by_year":[],"updated_date":"2026-06-16T07:37:23.134862","created_date":"2026-06-16T00:00:00"}
