{"id":"https://openalex.org/W7131400110","doi":"https://doi.org/10.48550/arxiv.2602.19575","title":"ConceptPrism: Concept Disentanglement in Personalized Diffusion Models via Residual Token Optimization","display_name":"ConceptPrism: Concept Disentanglement in Personalized Diffusion Models via Residual Token Optimization","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131400110","doi":"https://doi.org/10.48550/arxiv.2602.19575"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19575","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19575","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19575","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126256704","display_name":"Minseo Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Minseo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112924032","display_name":"Minchan Kwon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, Minchan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060156849","display_name":"Dongyeun Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Dongyeun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001840155","display_name":"Yunho Jeon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeon, Yunho","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100606264","display_name":"Jun-Mo Kim","orcid":"https://orcid.org/0000-0002-2238-3255"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Junmo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7796000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7796000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.08640000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.06270000338554382,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.8187999725341797},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.7567999958992004},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6549000144004822},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.6517000198364258},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4462999999523163},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.43799999356269836}],"concepts":[{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.8187999725341797},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.804099977016449},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.7567999958992004},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6549000144004822},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.6517000198364258},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.477400004863739},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.43799999356269836},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.38199999928474426},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3781000077724457},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.329800009727478},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31690001487731934},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2840000092983246},{"id":"https://openalex.org/C2988416141","wikidata":"https://www.wikidata.org/wiki/Q6031139","display_name":"Information loss","level":2,"score":0.2700999975204468},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2646999955177307},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19575","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19575","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19575","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19575","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.8245305418968201,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Personalized":[0],"text-to-image":[1],"(T2I)":[2],"generation":[3],"has":[4],"emerged":[5],"as":[6],"a":[7,15,78,94],"key":[8],"application":[9],"for":[10],"creating":[11],"user-specific":[12],"concepts":[13],"from":[14,29],"few":[16],"reference":[17],"images.":[18],"The":[19,150],"core":[20],"challenge":[21],"is":[22,152],"concept":[23,28,52,137],"disentanglement:":[24],"separating":[25],"the":[26,49,113,122,127],"target":[27,95,123],"irrelevant":[30],"residual":[31,99,111],"information.":[32,90],"Lacking":[33],"such":[34],"disentanglement,":[35],"capturing":[36],"high-fidelity":[37],"features":[38,83],"often":[39,65],"incorporates":[40],"undesired":[41],"attributes":[42],"that":[43,80,120,133],"conflict":[44],"with":[45],"user":[46],"prompts,":[47],"compromising":[48],"trade-off":[50],"between":[51],"fidelity":[53],"and":[54,72,97,103,139,146],"text":[55],"alignment.":[56],"While":[57],"existing":[58],"methods":[59],"rely":[60],"on":[61],"manual":[62],"guidance,":[63],"they":[64],"fail":[66],"to":[67,125],"represent":[68],"intricate":[69],"visual":[70,148],"details":[71],"lack":[73],"scalability.":[74],"We":[75,91],"introduce":[76],"ConceptPrism,":[77],"framework":[79],"extracts":[81],"shared":[82,108],"exclusively":[84],"through":[85],"cross-image":[86],"comparison":[87],"without":[88],"external":[89],"jointly":[92],"optimize":[93],"token":[96,124],"image-wise":[98],"tokens":[100],"via":[101],"reconstruction":[102],"exclusion":[104,114],"losses.":[105],"By":[106],"suppressing":[107],"information":[109,118],"in":[110],"tokens,":[112],"loss":[115],"creates":[116],"an":[117],"vacuum":[119],"forces":[121],"capture":[126],"common":[128],"concept.":[129],"Extensive":[130],"evaluations":[131],"demonstrate":[132],"ConceptPrism":[134],"achieves":[135],"accurate":[136],"disentanglement":[138],"significantly":[140],"improves":[141],"overall":[142],"performance":[143],"across":[144],"diverse":[145],"complex":[147],"concepts.":[149],"code":[151],"available":[153],"at":[154],"https://github.com/Minseo-Kimm/ConceptPrism.":[155]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-26T00:00:00"}
