{"id":"https://openalex.org/W7139125977","doi":"https://doi.org/10.48550/arxiv.2603.17944","title":"TransText: Alpha-as-RGB Representation for Transparent Text Animation","display_name":"TransText: Alpha-as-RGB Representation for Transparent Text Animation","publication_year":2026,"publication_date":"2026-03-18","ids":{"openalex":"https://openalex.org/W7139125977","doi":"https://doi.org/10.48550/arxiv.2603.17944"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.17944","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17944","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.17944","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129784232","display_name":"Fei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Fei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130209730","display_name":"Zijian Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zijian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130045760","display_name":"Bohao Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Bohao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130124130","display_name":"Sen He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Sen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129904794","display_name":"Hang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Hang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129876217","display_name":"Zhe Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068643077","display_name":"Soubhik Sanyal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanyal, Soubhik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129973221","display_name":"Pengfei Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Pengfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048585869","display_name":"Viktar Atliha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Atliha, Viktar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130209049","display_name":"Tao Xiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129991194","display_name":"Frost Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Frost","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5042454355","display_name":"Semih G\u00fcnel","orcid":"https://orcid.org/0000-0002-0863-8928"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gunel, Semih","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5129784232"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8263000249862671,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8263000249862671,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.0272000003606081,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.023900000378489494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.6995000243186951},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5473999977111816},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.47679999470710754},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.460099995136261},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4440999925136566},{"id":"https://openalex.org/keywords/toolbox","display_name":"Toolbox","score":0.4311000108718872},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.38339999318122864},{"id":"https://openalex.org/keywords/skew","display_name":"Skew","score":0.3662000000476837},{"id":"https://openalex.org/keywords/glyph","display_name":"Glyph (data visualization)","score":0.3650999963283539},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3546999990940094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8062999844551086},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.6995000243186951},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6330000162124634},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5473999977111816},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.47679999470710754},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.460099995136261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4440999925136566},{"id":"https://openalex.org/C2777655017","wikidata":"https://www.wikidata.org/wiki/Q1501161","display_name":"Toolbox","level":2,"score":0.4311000108718872},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39480000734329224},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.38339999318122864},{"id":"https://openalex.org/C43711488","wikidata":"https://www.wikidata.org/wiki/Q7534783","display_name":"Skew","level":2,"score":0.3662000000476837},{"id":"https://openalex.org/C142816647","wikidata":"https://www.wikidata.org/wiki/Q5573018","display_name":"Glyph (data visualization)","level":3,"score":0.3650999963283539},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3546999990940094},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.35339999198913574},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.35269999504089355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35089999437332153},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.33899998664855957},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.3375000059604645},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.33379998803138733},{"id":"https://openalex.org/C2780575108","wikidata":"https://www.wikidata.org/wiki/Q7316652","display_name":"Retargeting","level":2,"score":0.32820001244544983},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3082999885082245},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.30329999327659607},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C40305131","wikidata":"https://www.wikidata.org/wiki/Q2616305","display_name":"Obfuscation","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.26660001277923584},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.2597000002861023},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.25859999656677246},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.17944","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17944","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.17944","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.17944","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"introduce":[1],"the":[2,6,32,43,47,50,58,66,74,112,118],"first":[3],"method,":[4],"to":[5,15,42,85,104],"best":[7],"of":[8,49,60],"our":[9],"knowledge,":[10],"for":[11,23],"adapting":[12],"image-to-video":[13],"models":[14],"layer-aware":[16],"text":[17],"(glyph)":[18],"animation,":[19],"a":[20,96,100],"capability":[21],"critical":[22],"practical":[24],"dynamic":[25],"visual":[26,124],"design.":[27],"Existing":[28],"approaches":[29],"predominantly":[30],"handle":[31],"transparency-encoding":[33],"(alpha":[34],"channel)":[35],"as":[36,121],"an":[37,122],"extra":[38],"latent":[39,86,127],"dimension":[40],"appended":[41],"RGB":[44,81],"space,":[45],"necessitating":[46],"reconstruction":[48],"underlying":[51],"RGB-centric":[52],"variational":[53],"autoencoder":[54],"(VAE).":[55],"However,":[56],"given":[57],"scarcity":[59],"high-quality":[61],"transparent":[62,151],"glyph":[63],"data,":[64],"retraining":[65],"VAE":[67],"is":[68],"computationally":[69],"expensive":[70],"and":[71,108],"may":[72],"erode":[73],"robust":[75],"semantic":[76],"priors":[77],"learned":[78],"from":[79],"massive":[80],"corpora,":[82],"potentially":[83],"leading":[84],"pattern":[87],"mixing.":[88],"To":[89],"mitigate":[90],"these":[91],"limitations,":[92],"we":[93],"propose":[94],"TransText,":[95],"framework":[97],"based":[98],"on":[99],"novel":[101],"Alpha-as-RGB":[102],"paradigm":[103],"jointly":[105],"model":[106],"appearance":[107],"transparency":[109],"without":[110],"modifying":[111],"pre-trained":[113],"generative":[114],"manifold.":[115],"TransText":[116,144],"embeds":[117],"alpha":[119],"channel":[120],"RGB-compatible":[123],"signal":[125],"through":[126],"spatial":[128],"concatenation,":[129],"explicitly":[130],"ensuring":[131],"strict":[132],"cross-modal":[133],"(RGB-and-Alpha)":[134],"consistency":[135],"while":[136],"preventing":[137],"feature":[138],"entanglement.":[139],"Our":[140],"experiments":[141],"demonstrate":[142],"that":[143],"significantly":[145],"outperforms":[146],"baselines,":[147],"generating":[148],"coherent,":[149],"high-fidelity":[150],"animations":[152],"with":[153],"diverse,":[154],"fine-grained":[155],"effects.":[156]},"counts_by_year":[],"updated_date":"2026-03-21T06:30:42.041108","created_date":"2026-03-20T00:00:00"}
