{"id":"https://openalex.org/W7147142811","doi":"https://doi.org/10.48550/arxiv.2603.27666","title":"Gated Condition Injection without Multimodal Attention: Towards Controllable Linear-Attention Transformers","display_name":"Gated Condition Injection without Multimodal Attention: Towards Controllable Linear-Attention Transformers","publication_year":2026,"publication_date":"2026-03-29","ids":{"openalex":"https://openalex.org/W7147142811","doi":"https://doi.org/10.48550/arxiv.2603.27666"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27666","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055720148","display_name":"Yuhe Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yuhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132583911","display_name":"Zhenxiong Tan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Zhenxiong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132546998","display_name":"Yujia Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yujia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132609387","display_name":"Songhua Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Songhua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132656720","display_name":"Xinchao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xinchao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.26649999618530273,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.26649999618530273,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.17759999632835388,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.08250000327825546,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6694999933242798},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5856999754905701},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.5116000175476074},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.4821000099182129},{"id":"https://openalex.org/keywords/high-fidelity","display_name":"High fidelity","score":0.4530999958515167},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.43650001287460327},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3646000027656555}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7427999973297119},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6694999933242798},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.5116000175476074},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.49070000648498535},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.4821000099182129},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.4530999958515167},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.43650001287460327},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3646000027656555},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3366999924182892},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.3357999920845032},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.33559998869895935},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.313400000333786},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.28630000352859497},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.2590999901294708},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27666","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,12,47,125,132,172],"diffusion-based":[3],"controllable":[4,50,74,109,162],"visual":[5],"generation":[6,75,163],"have":[7],"led":[8],"to":[9,26,86],"remarkable":[10],"improvements":[11],"image":[13],"quality.":[14],"However,":[15],"these":[16,103],"powerful":[17],"models":[18,52],"are":[19],"typically":[20],"deployed":[21],"on":[22,65,97,151,166],"cloud":[23],"servers":[24],"due":[25],"their":[27],"large":[28],"computational":[29],"demands,":[30],"raising":[31],"serious":[32],"concerns":[33],"about":[34],"user":[35],"data":[36],"privacy.":[37],"To":[38,101],"enable":[39],"secure":[40],"and":[41,62,80,146,154,176],"efficient":[42],"on-device":[43],"generation,":[44],"we":[45,105],"explore":[46],"this":[48],"paper":[49],"diffusion":[51,110],"built":[53],"upon":[54],"linear":[55,114],"attention":[56,115],"architectures,":[57],"which":[58,136],"offer":[59],"superior":[60],"scalability":[61],"efficiency,":[63],"even":[64],"edge":[66],"devices.":[67],"Yet,":[68],"our":[69,122,158],"experiments":[70,150],"reveal":[71],"that":[72,157],"existing":[73,170],"frameworks,":[76],"such":[77,98,142],"as":[78,143],"ControlNet":[79],"OminiControl,":[81],"either":[82],"lack":[83],"the":[84],"flexibility":[85],"support":[87],"multiple":[88,152],"heterogeneous":[89],"condition":[90],"types":[91],"or":[92],"suffer":[93],"from":[94],"slow":[95],"convergence":[96],"linear-attention":[99,167],"models.":[100],"address":[102],"limitations,":[104],"propose":[106],"a":[107,126,133],"novel":[108],"framework":[111],"tailored":[112],"for":[113],"backbones":[116],"like":[117],"SANA.":[118],"The":[119],"core":[120],"of":[121,174],"method":[123],"lies":[124],"unified":[127],"gated":[128],"conditioning":[129],"module":[130],"working":[131],"dual-path":[134],"pipeline,":[135],"effectively":[137],"integrates":[138],"multi-type":[139],"conditional":[140],"inputs,":[141],"spatially":[144],"aligned":[145],"non-aligned":[147],"cues.":[148],"Extensive":[149],"tasks":[153],"benchmarks":[155],"demonstrate":[156],"approach":[159],"achieves":[160],"state-of-the-art":[161],"performance":[164],"based":[165],"models,":[168],"surpassing":[169],"methods":[171],"terms":[173],"fidelity":[175],"controllability.":[177]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-02T00:00:00"}
