{"id":"https://openalex.org/W7134817152","doi":"https://doi.org/10.48550/arxiv.2603.08589","title":"CARE-Edit: Condition-Aware Routing of Experts for Contextual Image Editing","display_name":"CARE-Edit: Condition-Aware Routing of Experts for Contextual Image Editing","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134817152","doi":"https://doi.org/10.48550/arxiv.2603.08589"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.08589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128633624","display_name":"Yucheng Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Yucheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044435921","display_name":"Zedong Wang","orcid":"https://orcid.org/0009-0000-0112-0491"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zedong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101894731","display_name":"Yuetong Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yuetong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128665113","display_name":"Yue Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128654764","display_name":"Dan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Dan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5128633624"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7594000101089478,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7594000101089478,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.05950000137090683,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12377","display_name":"Digital Humanities and Scholarship","score":0.013399999588727951,"subfield":{"id":"https://openalex.org/subfields/1208","display_name":"Literature and Literary Theory"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.5655999779701233},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5389000177383423},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5278000235557556},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.4916999936103821},{"id":"https://openalex.org/keywords/router","display_name":"Router","score":0.45660001039505005},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4453999996185303},{"id":"https://openalex.org/keywords/concatenation","display_name":"Concatenation (mathematics)","score":0.43950000405311584},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4325000047683716},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.41679999232292175}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8360000252723694},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.5655999779701233},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5389000177383423},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5278000235557556},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.4916999936103821},{"id":"https://openalex.org/C2775896111","wikidata":"https://www.wikidata.org/wiki/Q642560","display_name":"Router","level":2,"score":0.45660001039505005},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4453999996185303},{"id":"https://openalex.org/C87619178","wikidata":"https://www.wikidata.org/wiki/Q126002","display_name":"Concatenation (mathematics)","level":2,"score":0.43950000405311584},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4325000047683716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4189999997615814},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.41679999232292175},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.375},{"id":"https://openalex.org/C2775945657","wikidata":"https://www.wikidata.org/wiki/Q381442","display_name":"Structuring","level":2,"score":0.3361999988555908},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.33219999074935913},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3160000145435333},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3050999939441681},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.2955999970436096},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2822999954223633},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.27570000290870667},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2653999924659729},{"id":"https://openalex.org/C87868495","wikidata":"https://www.wikidata.org/wiki/Q750843","display_name":"Information processing","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25440001487731934},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25369998812675476},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.25049999356269836}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.08589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.08589","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08589","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.08589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"No poverty","id":"https://metadata.un.org/sdg/1","score":0.6669642329216003}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Unified":[0],"diffusion":[1,106,120],"editors":[2],"often":[3],"rely":[4],"on":[5,116,177],"a":[6,100,123,153],"fixed,":[7],"shared":[8],"backbone":[9],"for":[10,132],"diverse":[11],"tasks,":[12,180],"suffering":[13],"from":[14],"task":[15],"interference":[16],"and":[17,34,73,114,119,165,186],"poor":[18],"adaptation":[19],"to":[20,108,143,147,168,205],"heterogeneous":[21],"demands":[22],"(e.g.,":[23,41],"local":[24],"vs":[25,28],"global,":[26],"semantic":[27],"photometric).":[29],"In":[30],"particular,":[31],"prevalent":[32],"ControlNet":[33],"OmniControl":[35],"variants":[36],"combine":[37],"multiple":[38],"conditioning":[39],"signals":[40],"text,":[42],"mask,":[43],"reference)":[44],"via":[45],"static":[46],"concatenation":[47],"or":[48,55,70],"additive":[49],"adapters":[50],"which":[51],"cannot":[52],"dynamically":[53,144],"prioritize":[54],"suppress":[56],"conflicting":[57],"modalities,":[58],"thus":[59],"resulting":[60],"in":[61],"artifacts":[62],"like":[63],"color":[64],"bleeding":[65],"across":[66],"mask":[67],"boundaries,":[68],"identity":[69],"style":[71,187],"drift,":[72],"unpredictable":[74],"behavior":[75,194],"under":[76],"multi-condition":[77,207],"inputs.":[78],"To":[79],"address":[80],"this,":[81],"we":[82],"propose":[83],"Condition-Aware":[84],"Routing":[85],"of":[86,195,201],"Experts":[87],"(CARE-Edit)":[88],"that":[89],"aligns":[90],"model":[91],"computation":[92,146],"with":[93],"specific":[94],"editing":[95,179],"competencies.":[96],"At":[97],"its":[98],"core,":[99],"lightweight":[101],"latent-attention":[102],"router":[103,138],"assigns":[104],"encoded":[105],"tokens":[107],"four":[109],"specialized":[110,196],"experts--Text,":[111],"Mask,":[112],"Reference,":[113],"Base--based":[115],"multi-modal":[117],"conditions":[118],"timesteps:":[121],"(i)":[122],"Mask":[124],"Repaint":[125],"module":[126,156],"first":[127],"refines":[128],"coarse":[129],"user-defined":[130],"masks":[131],"precise":[133],"spatial":[134],"guidance;":[135],"(ii)":[136],"the":[137,148,169,199],"applies":[139],"sparse":[140],"top-K":[141],"selection":[142],"allocate":[145],"most":[149],"relevant":[150],"experts;":[151],"(iii)":[152],"Latent":[154],"Mixture":[155],"subsequently":[157],"fuses":[158],"expert":[159],"outputs,":[160],"coherently":[161],"integrating":[162],"semantic,":[163],"spatial,":[164],"stylistic":[166],"information":[167],"base":[170],"images.":[171],"Experiments":[172],"validate":[173],"CARE-Edit's":[174],"strong":[175],"performance":[176],"contextual":[178],"including":[181],"erasure,":[182],"replacement,":[183],"text-driven":[184],"edits,":[185],"transfer.":[188],"Empirical":[189],"analysis":[190],"further":[191],"reveals":[192],"task-specific":[193],"experts,":[197],"showcasing":[198],"importance":[200],"dynamic,":[202],"condition-aware":[203],"processing":[204],"mitigate":[206],"conflicts.":[208]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-11T00:00:00"}
