{"id":"https://openalex.org/W7138155845","doi":"https://doi.org/10.1609/aaai.v40i4.37247","title":"RelaCtrl: Relevance-Guided Efficient Control for Diffusion Transformers","display_name":"RelaCtrl: Relevance-Guided Efficient Control for Diffusion Transformers","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138155845","doi":"https://doi.org/10.1609/aaai.v40i4.37247"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i4.37247","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i4.37247","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i4.37247","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ke Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ke Cao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jing Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jing Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ao Ma","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jiasong Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiasong Feng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xuanhua He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xuanhua He","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Run Ling","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Run Ling","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Haowei Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haowei Liu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jian Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jian Lu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wei Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei Feng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Haozhe Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haozhe Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Hongjuan Pei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongjuan Pei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yihua Shao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yihua Shao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhanjie Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhanjie Zhang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Jie Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jie Zhang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.44307469,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"40","issue":"4","first_page":"2598","last_page":"2606"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7620000243186951,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7620000243186951,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.028200000524520874,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.019899999722838402,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6051999926567078},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.39879998564720154},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.31380000710487366},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.2842999994754791},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2687999904155731}],"concepts":[{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6051999926567078},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6040999889373779},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.4657000005245209},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.39879998564720154},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.3246999979019165},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.31380000710487366},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2842999994754791},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C51704429","wikidata":"https://www.wikidata.org/wiki/Q827792","display_name":"Quality control","level":3,"score":0.26510000228881836},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.25270000100135803},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2513999938964844},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i4.37247","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i4.37247","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i4.37247","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i4.37247","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.4672267735004425,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"Diffusion":[1,76,88],"Transformer":[2,89],"plays":[3],"a":[4],"pivotal":[5],"role":[6],"in":[7,86,160],"advancing":[8],"text-to-image":[9],"and":[10,28,31,68,115,135,146,158,182,187,204],"text-to-video":[11],"generation,":[12],"owing":[13],"primarily":[14],"to":[15,38,41,90,142,150,208],"its":[16],"inherent":[17],"scalability.":[18],"However,":[19],"existing":[20],"controlled":[21],"diffusion":[22],"transformer":[23,52],"methods":[24],"incur":[25],"significant":[26],"parameter":[27,133],"computational":[29,205],"overheads":[30],"suffer":[32],"from":[33],"inefficient":[34],"resource":[35],"allocation":[36],"due":[37],"their":[39],"failure":[40],"account":[42],"for":[43],"the":[44,59,75,81,87,91,96,102,111,116,123,126,131,139,156,161,167,179,202],"varying":[45],"relevance":[46,82],"of":[47,71,83,104,113,125,138,177,201],"control":[48,72,92,107,117,140],"information":[49,93],"across":[50],"different":[51],"layers.":[53],"To":[54],"address":[55],"this,":[56],"we":[57,79,128,154],"propose":[58],"Relevance-Guided":[60],"Efficient":[61],"Controllable":[62],"Generation":[63],"framework,":[64],"RelaCtrl,":[65],"enabling":[66,174],"efficient":[67,175],"resource-optimized":[69],"integration":[70],"signals":[73],"into":[74],"Transformer.":[77],"First,":[78],"evaluate":[80],"each":[84,106],"layer":[85,108],"by":[94],"assessing":[95],"ControlNet":[97],"Relevance":[98],"Score,":[99],"which":[100],"measures":[101],"impact":[103],"skipping":[105],"on":[109,122],"both":[110,178],"quality":[112],"generation":[114],"effectiveness":[118],"during":[119],"inference.":[120],"Based":[121],"strength":[124],"relevance,":[127],"then":[129],"tailor":[130],"positioning,":[132],"scale,":[134],"modeling":[136],"capacity":[137],"layers":[141],"reduce":[143],"unnecessary":[144],"parameters":[145,203],"redundant":[147],"computations.":[148],"Additionally,":[149],"further":[151],"improve":[152],"efficiency,":[153],"replace":[155],"self-attention":[157],"FFN":[159],"commonly":[162],"used":[163],"copy":[164],"block":[165],"with":[166,198],"carefully":[168],"designed":[169],"Two-Dimensional":[170],"Shuffle":[171],"Mixer":[172],"(TDSM),":[173],"implementation":[176],"token":[180],"mixer":[181],"channel":[183],"mixer.":[184],"Both":[185],"qualitative":[186],"quantitative":[188],"experimental":[189],"results":[190],"demonstrate":[191],"that":[192],"our":[193],"approach":[194],"achieves":[195],"superior":[196],"performance":[197],"only":[199],"15%":[200],"complexity":[206],"compared":[207],"PixArt-delta.":[209]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-01T00:00:00"}
