{"id":"https://openalex.org/W7117760764","doi":"https://doi.org/10.48550/arxiv.2512.22437","title":"EmoCtrl: Controllable Emotional Image Content Generation","display_name":"EmoCtrl: Controllable Emotional Image Content Generation","publication_year":2025,"publication_date":"2025-12-27","ids":{"openalex":"https://openalex.org/W7117760764","doi":"https://doi.org/10.48550/arxiv.2512.22437"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.22437","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.22437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.22437","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121672838","display_name":"Jingyuan Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Jingyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100298507","display_name":"Weibin Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Weibin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121639247","display_name":"Hui Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Hui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5121672838"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5457000136375427,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.5457000136375427,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1378999948501587,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.050700001418590546,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.6039999723434448},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5753999948501587},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.572700023651123},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5281000137329102},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5065000057220459},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4616999924182892},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3937999904155731},{"id":"https://openalex.org/keywords/emotional-expression","display_name":"Emotional expression","score":0.3763999938964844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794999837875366},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.6039999723434448},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5753999948501587},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.572700023651123},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5658000111579895},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5281000137329102},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5065000057220459},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4616999924182892},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4032000005245209},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3937999904155731},{"id":"https://openalex.org/C143110190","wikidata":"https://www.wikidata.org/wiki/Q5373787","display_name":"Emotional expression","level":2,"score":0.3763999938964844},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3671000003814697},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.3580000102519989},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.3504999876022339},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C2776141551","wikidata":"https://www.wikidata.org/wiki/Q16000087","display_name":"Emotion perception","level":3,"score":0.30239999294281006},{"id":"https://openalex.org/C162446236","wikidata":"https://www.wikidata.org/wiki/Q653137","display_name":"Content analysis","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.28600001335144043},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.2815000116825104},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C2778143943","wikidata":"https://www.wikidata.org/wiki/Q523747","display_name":"Expressed emotion","level":2,"score":0.2646999955177307},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2533999979496002},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.22437","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.22437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.22437","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.22437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"An":[0],"image":[1],"conveys":[2],"meaning":[3],"through":[4],"both":[5],"its":[6],"visual":[7,86,92],"content":[8,35,46,62,130],"and":[9,79,91,103,131,158],"emotional":[10,50],"tone,":[11],"jointly":[12],"shaping":[13],"human":[14,109,145],"perception.":[15],"We":[16],"introduce":[17,113],"Controllable":[18],"Emotional":[19],"Image":[20],"Content":[21],"Generation":[22],"(C-EICG),":[23],"which":[24],"aims":[25],"to":[26,32,85,151],"generate":[27,55],"images":[28],"that":[29,96,126],"remain":[30],"faithful":[31,129],"a":[33,39,73],"given":[34],"description":[36],"while":[37],"expressing":[38],"target":[40],"emotion.":[41],"Existing":[42],"text-to-image":[43],"models":[44,54],"ensure":[45],"consistency":[47],"but":[48],"lack":[49],"awareness,":[51],"whereas":[52],"emotion-driven":[53,115],"affective":[56,80,98],"results":[57],"at":[58],"the":[59,156,161],"cost":[60],"of":[61,160],"distortion.":[63],"To":[64,106],"address":[65],"this":[66],"gap,":[67],"we":[68,111],"propose":[69],"EmoCtrl,":[70],"supported":[71],"by":[72],"dataset":[74],"annotated":[75],"with":[76,108,118,144],"content,":[77],"emotion,":[78],"prompts,":[81],"bridging":[82],"abstract":[83],"emotions":[84],"cues.":[87,105],"EmoCtrl":[88,127,148],"incorporates":[89],"textual":[90],"emotion":[93,121,133,163],"enhancement":[94],"modules":[95],"enrich":[97],"expression":[99],"via":[100],"descriptive":[101],"semantics":[102],"perceptual":[104],"align":[107],"preference,":[110],"further":[112,154],"an":[114],"preference":[116],"optimization":[117],"specifically":[119],"designed":[120],"reward.":[122],"Comprehensive":[123],"experiments":[124],"demonstrate":[125],"achieves":[128],"expressive":[132],"control,":[134],"outperforming":[135],"existing":[136],"methods.":[137],"User":[138],"studies":[139],"confirm":[140],"EmoCtrl's":[141],"strong":[142],"alignment":[143],"preference.":[146],"Moreover,":[147],"generalizes":[149],"well":[150],"creative":[152],"applications,":[153],"demonstrating":[155],"robustness":[157],"adaptability":[159],"learned":[162],"tokens.":[164]},"counts_by_year":[],"updated_date":"2026-04-14T06:02:45.956762","created_date":"2025-12-31T00:00:00"}
