{"id":"https://openalex.org/W7139925732","doi":"https://doi.org/10.48550/arxiv.2603.19158","title":"Adaptive Auxiliary Prompt Blending for Target-Faithful Diffusion Generation","display_name":"Adaptive Auxiliary Prompt Blending for Target-Faithful Diffusion Generation","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139925732","doi":"https://doi.org/10.48550/arxiv.2603.19158"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.19158","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19158","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.19158","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130242073","display_name":"Kwanyoung Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lee, Kwanyoung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056418200","display_name":"SeungJu Cha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cha, SeungJu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130233980","display_name":"Yebin Ahn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahn, Yebin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130246411","display_name":"Hyunwoo Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oh, Hyunwoo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049890458","display_name":"Sungho Koh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koh, Sungho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130227668","display_name":"Dong-Jin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Dong-Jin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5130242073"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9298999905586243,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9298999905586243,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.023399999365210533,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.010900000110268593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.7578999996185303},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.7026000022888184},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5659999847412109},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5246999859809875},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.45820000767707825},{"id":"https://openalex.org/keywords/adaptive-optimization","display_name":"Adaptive optimization","score":0.36500000953674316},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.33970001339912415},{"id":"https://openalex.org/keywords/alternation","display_name":"Alternation (linguistics)","score":0.3197999894618988}],"concepts":[{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.7578999996185303},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7386999726295471},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.7026000022888184},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5659999847412109},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4661000072956085},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.45820000767707825},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3840999901294708},{"id":"https://openalex.org/C149672232","wikidata":"https://www.wikidata.org/wiki/Q337048","display_name":"Adaptive optimization","level":2,"score":0.36500000953674316},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.33970001339912415},{"id":"https://openalex.org/C26826806","wikidata":"https://www.wikidata.org/wiki/Q438358","display_name":"Alternation (linguistics)","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3127000033855438},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.30630001425743103},{"id":"https://openalex.org/C2982777018","wikidata":"https://www.wikidata.org/wiki/Q99268086","display_name":"Adaptive design","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.2897000014781952},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.26989999413490295},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26190000772476196},{"id":"https://openalex.org/C200873422","wikidata":"https://www.wikidata.org/wiki/Q5448821","display_name":"Filling-in","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C171836373","wikidata":"https://www.wikidata.org/wiki/Q2266329","display_name":"Linear interpolation","level":3,"score":0.25360000133514404},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.19158","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19158","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.19158","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19158","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4548763334751129,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion-based":[0],"text-to-image":[1],"(T2I)":[2],"models":[3,29],"have":[4],"made":[5],"remarkable":[6],"progress":[7],"in":[8,21,75,87,94,134],"generating":[9],"photorealistic":[10],"and":[11,91,125,142,151,167,175,182],"semantically":[12,32],"rich":[13],"images.":[14],"However,":[15],"when":[16],"the":[17,25,42,72,101,119,122,126,156,173],"target":[18,102,127],"concepts":[19,50],"lie":[20],"low-density":[22,76],"regions":[23],"of":[24,45,158],"training":[26],"distribution,":[27],"these":[28],"often":[30],"produce":[31],"misaligned":[33],"or":[34,51],"structurally":[35],"inconsistent":[36],"results.":[37],"This":[38],"limitation":[39],"arises":[40],"from":[41],"long-tailed":[43],"nature":[44],"text-image":[46],"datasets,":[47,177],"where":[48],"rare":[49,88],"editing":[52],"instructions":[53],"are":[54],"underrepresented.":[55],"To":[56],"address":[57],"this,":[58],"we":[59],"introduce":[60],"Adaptive":[61],"Auxiliary":[62],"Prompt":[63],"Blending":[64],"(AAPB)":[65],"-":[66],"a":[67,112,140],"unified":[68],"framework":[69,144],"that":[70,116],"stabilizes":[71],"diffusion":[73,131],"process":[74],"regions.":[77],"AAPB":[78,110],"leverages":[79],"auxiliary":[80,123],"anchor":[81,124],"prompts":[82],"to":[83,186],"provide":[84],"semantic":[85,180],"support":[86,93],"concept":[89],"generation":[90],"structural":[92,183],"image":[95],"editing,":[96],"ensuring":[97,149],"faithful":[98],"guidance":[99],"toward":[100],"prompt.":[103],"Unlike":[104],"prior":[105,187],"heuristic":[106],"prompt":[107,128,147],"alternation":[108],"methods,":[109],"derives":[111],"closed-form":[113],"adaptive":[114,146,159],"coefficient":[115],"optimally":[117],"balances":[118],"influence":[120],"between":[121],"at":[129],"each":[130],"step.":[132],"Grounded":[133],"Tweedie's":[135],"identity,":[136],"our":[137],"formulation":[138],"provides":[139],"principled":[141],"training-free":[143,188],"for":[145],"blending,":[148],"stable":[150],"target-faithful":[152],"generation.":[153],"We":[154],"demonstrate":[155],"effectiveness":[157],"interpolation":[160,163],"over":[161],"fixed":[162],"through":[164],"controlled":[165],"experiments":[166],"empirically":[168],"show":[169],"consistent":[170],"improvements":[171],"on":[172],"RareBench":[174],"FlowEdit":[176],"achieving":[178],"superior":[179],"accuracy":[181],"fidelity":[184],"compared":[185],"baselines.":[189]},"counts_by_year":[],"updated_date":"2026-03-21T06:36:02.116451","created_date":"2026-03-21T00:00:00"}
