{"id":"https://openalex.org/W7134917718","doi":"https://doi.org/10.48550/arxiv.2603.08928","title":"TIDE: Text-Informed Dynamic Extrapolation with Step-Aware Temperature Control for Diffusion Transformers","display_name":"TIDE: Text-Informed Dynamic Extrapolation with Step-Aware Temperature Control for Diffusion Transformers","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134917718","doi":"https://doi.org/10.48550/arxiv.2603.08928"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.08928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.08928","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128723070","display_name":"Yihua Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yihua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128779504","display_name":"Fanjiang Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Fanjiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128791280","display_name":"Bowen Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Bowen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010272260","display_name":"Rongyu Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Rongyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128787323","display_name":"Chengming Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chengming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.35089999437332153,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.35089999437332153,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.17100000381469727,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1378999948501587,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/extrapolation","display_name":"Extrapolation","score":0.878000020980835},{"id":"https://openalex.org/keywords/sharpening","display_name":"Sharpening","score":0.526199996471405},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4564000070095062},{"id":"https://openalex.org/keywords/temperature-measurement","display_name":"Temperature measurement","score":0.38850000500679016},{"id":"https://openalex.org/keywords/image-resolution","display_name":"Image resolution","score":0.3797999918460846},{"id":"https://openalex.org/keywords/temperature-control","display_name":"Temperature control","score":0.3776000142097473},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.37599998712539673},{"id":"https://openalex.org/keywords/on-the-fly","display_name":"On the fly","score":0.3686000108718872}],"concepts":[{"id":"https://openalex.org/C132459708","wikidata":"https://www.wikidata.org/wiki/Q744069","display_name":"Extrapolation","level":2,"score":0.878000020980835},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6401000022888184},{"id":"https://openalex.org/C2781137444","wikidata":"https://www.wikidata.org/wiki/Q237105","display_name":"Sharpening","level":2,"score":0.526199996471405},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4564000070095062},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4129999876022339},{"id":"https://openalex.org/C72293138","wikidata":"https://www.wikidata.org/wiki/Q909741","display_name":"Temperature measurement","level":2,"score":0.38850000500679016},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.3797999918460846},{"id":"https://openalex.org/C536315585","wikidata":"https://www.wikidata.org/wiki/Q7698332","display_name":"Temperature control","level":2,"score":0.3776000142097473},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.3686000108718872},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.34630000591278076},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3416000008583069},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33820000290870667},{"id":"https://openalex.org/C3020199158","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"High resolution","level":2,"score":0.33709999918937683},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.30709999799728394},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30059999227523804},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C119666444","wikidata":"https://www.wikidata.org/wiki/Q5977280","display_name":"Temporal resolution","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.2770000100135803},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.26969999074935913}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.08928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.08928","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08928","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","display_name":"Life below water","score":0.40102940797805786}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"Transformer":[1],"(DiT)":[2],"faces":[3],"challenges":[4],"when":[5],"generating":[6],"images":[7],"with":[8,65,134],"higher":[9],"resolution":[10,67,128],"compared":[11],"at":[12],"training":[13],"resolution,":[14],"causing":[15],"especially":[16],"structural":[17],"degradation":[18],"due":[19],"to":[20,26,35,90],"attention":[21,31],"dilution.":[22],"Previous":[23],"approaches":[24],"attempt":[25],"mitigate":[27],"this":[28,45],"by":[29],"sharpening":[30],"distributions,":[32],"but":[33],"fail":[34],"preserve":[36],"fine-grained":[37],"semantic":[38],"details":[39],"and":[40,53,68,84,96,131],"introduce":[41,85],"obvious":[42],"artifacts.":[43],"In":[44],"work,":[46],"we":[47,103],"analyze":[48],"the":[49,77,92,112,118],"characteristics":[50],"of":[51,114],"DiTs":[52],"propose":[54],"TIDE,":[55],"a":[56,86,105],"training-free":[57],"text-to-image":[58],"(T2I)":[59],"extrapolation":[60,129],"method":[61],"that":[62,110,124],"enables":[63],"generation":[64],"arbitrary":[66],"aspect":[69],"ratio":[70],"without":[71],"additional":[72],"sampling":[73],"overhead.":[74],"We":[75],"identify":[76],"core":[78],"factor":[79],"for":[80],"prompt":[81],"information":[82],"loss,":[83],"text":[87,95],"anchoring":[88],"mechanism":[89,109],"correct":[91],"imbalance":[93],"between":[94],"image":[97],"tokens.":[98],"To":[99],"further":[100],"eliminate":[101],"artifacts,":[102],"design":[104],"dynamic":[106],"temperature":[107],"control":[108],"leverages":[111],"pattern":[113],"spectral":[115],"progression":[116],"in":[117],"diffusion":[119],"process.":[120],"Extensive":[121],"evaluations":[122],"demonstrate":[123],"TIDE":[125],"delivers":[126],"high-quality":[127],"capability":[130],"integrates":[132],"seamlessly":[133],"existing":[135],"state-of-the-art":[136],"methods.":[137]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-12T00:00:00"}
