{"id":"https://openalex.org/W4415708094","doi":"https://doi.org/10.1109/icme59968.2025.11209494","title":"CosGaussian: Towards Text-to-3D Semantically Controllable 3D Object Style Transfer with Gaussian Splatting","display_name":"CosGaussian: Towards Text-to-3D Semantically Controllable 3D Object Style Transfer with Gaussian Splatting","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415708094","doi":"https://doi.org/10.1109/icme59968.2025.11209494"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11209494","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209494","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100639804","display_name":"Wendong Li","orcid":"https://orcid.org/0000-0002-4388-1966"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wendong Li","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101900911","display_name":"Gaojie Wu","orcid":"https://orcid.org/0000-0002-0752-8508"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaojie Wu","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiang Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Huang","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108050904","display_name":"Wei\u2010Shi Zheng","orcid":"https://orcid.org/0000-0001-8327-0003"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei-Shi Zheng","raw_affiliation_strings":["Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27087838,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.423799991607666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.423799991607666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.36419999599456787,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.09669999778270721,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.5910999774932861},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5443999767303467},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4693000018596649},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.427700012922287},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.4196999967098236},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.37070000171661377}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8052999973297119},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6079000234603882},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.5910999774932861},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5443999767303467},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4893999993801117},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4693000018596649},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.427700012922287},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.4196999967098236},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.37070000171661377},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3249000012874603},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2904999852180481},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11209494","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209494","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2603777577","https://openalex.org/W2738551266","https://openalex.org/W2798520250","https://openalex.org/W2962785568","https://openalex.org/W3034921716","https://openalex.org/W3109908659","https://openalex.org/W3215769467","https://openalex.org/W4221151978","https://openalex.org/W4286611176","https://openalex.org/W4312234520","https://openalex.org/W4312325284","https://openalex.org/W4312453532","https://openalex.org/W4385318467","https://openalex.org/W4385481295","https://openalex.org/W4386075604","https://openalex.org/W4386076215","https://openalex.org/W4387969181","https://openalex.org/W4390874575","https://openalex.org/W4402702918","https://openalex.org/W4402727529","https://openalex.org/W4402753826","https://openalex.org/W4404520200","https://openalex.org/W4411143022","https://openalex.org/W4413786056"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,53,68,101],"rapid":[2],"advancement":[3],"of":[4,52,71],"3D":[5,7,16,25,31,111,134],"technologies,":[6],"editing":[8,24],"techniques":[9],"have":[10],"become":[11],"increasingly":[12],"important,":[13],"among":[14],"which":[15],"stylization":[17,32,69,122],"serves":[18],"as":[19],"a":[20,43,92,127],"crucial":[21],"tool":[22],"for":[23,82,131],"surfaces.":[26],"However,":[27],"semantically":[28,132],"controllable":[29,133],"object-level":[30],"remains":[33],"an":[34],"open":[35],"challenge.":[36],"In":[37],"this":[38],"article,":[39],"we":[40,86],"propose":[41],"CosGaussian,":[42],"framework":[44],"based":[45],"on":[46],"3DGS":[47],"that":[48,97,115],"enables":[49],"precise":[50],"control":[51],"transfer":[54,95,100],"style":[55,79,94,103,105,135],"in":[56,110,120],"object-level.":[57],"Firstly,":[58],"by":[59],"leveraging":[60],"Vision-Language":[61],"Models":[62],"(VLMs),":[63],"CosGaussian":[64,116],"can":[65,98],"effectively":[66],"extract":[67],"intentions":[70],"textual":[72],"input":[73],"from":[74,104],"user":[75],"and":[76,124],"generate":[77],"corresponding":[78],"reference":[80,106],"image":[81,107],"subsequent":[83],"stylization.":[84],"Then,":[85],"introduce":[87],"Adaptive":[88],"Feature":[89],"Transfer":[90],"(AFT),":[91],"semantics-aware":[93],"method":[96],"accurately":[99],"local":[102],"to":[108],"objects":[109],"scenes.":[112],"Experiments":[113],"demonstrate":[114],"outperforms":[117],"state-of-the-art":[118],"methods":[119],"both":[121],"accuracy":[123],"quality,":[125],"presenting":[126],"robust,":[128],"user-friendly":[129],"solution":[130],"transfer.":[136]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-30T00:00:00"}
