{"id":"https://openalex.org/W7141681266","doi":"https://doi.org/10.48550/arxiv.2603.24800","title":"Calibri: Enhancing Diffusion Transformers via Parameter-Efficient Calibration","display_name":"Calibri: Enhancing Diffusion Transformers via Parameter-Efficient Calibration","publication_year":2026,"publication_date":"2026-03-25","ids":{"openalex":"https://openalex.org/W7141681266","doi":"https://doi.org/10.48550/arxiv.2603.24800"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.24800","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24800","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.24800","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130765427","display_name":"Danil Tokhchukov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tokhchukov, Danil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130766713","display_name":"Aysel Mirzoeva","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mirzoeva, Aysel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130779337","display_name":"Andrey Kuznetsov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuznetsov, Andrey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5075050471","display_name":"Konstantin Sobolev","orcid":"https://orcid.org/0000-0003-2969-3501"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sobolev, Konstantin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8240000009536743,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8240000009536743,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.01549999974668026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.01489999983459711,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.666700005531311},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6421999931335449},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6279000043869019},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.6068000197410583},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.3637000024318695},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.35839998722076416}],"concepts":[{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.666700005531311},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6421999931335449},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6279000043869019},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.6068000197410583},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5241000056266785},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38769999146461487},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3871999979019165},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.38589999079704285},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.3637000024318695},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.35839998722076416},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3474000096321106},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3416000008583069},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.3352000117301941},{"id":"https://openalex.org/C2987595161","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Optimization algorithm","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.29319998621940613},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27489998936653137},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2689000070095062}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.24800","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24800","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.24800","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24800","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1,44],"paper,":[2],"we":[3,25,46],"uncover":[4],"the":[5,22,37,104],"hidden":[6],"potential":[7],"of":[8,21,39],"Diffusion":[9],"Transformers":[10],"(DiTs)":[11],"to":[12,57],"significantly":[13,35],"enhance":[14],"generative":[15,59],"tasks.":[16],"Through":[17],"an":[18,76],"in-depth":[19],"analysis":[20],"denoising":[23],"process,":[24],"demonstrate":[26],"that":[27,52,87],"introducing":[28],"a":[29,49,66],"single":[30],"learned":[31],"scaling":[32],"parameter":[33],"can":[34],"improve":[36],"performance":[38,95],"DiT":[40,55,63],"blocks.":[41],"Building":[42],"on":[43],"insight,":[45],"propose":[47],"Calibri,":[48],"parameter-efficient":[50],"approach":[51],"optimally":[53],"calibrates":[54],"components":[56],"elevate":[58],"quality.":[60],"Calibri":[61,92,101],"frames":[62],"calibration":[64],"as":[65],"black-box":[67],"reward":[68],"optimization":[69],"problem,":[70],"which":[71],"is":[72],"efficiently":[73],"solved":[74],"using":[75],"evolutionary":[77],"algorithm":[78],"and":[79],"modifies":[80],"just":[81],"~100":[82],"parameters.":[83],"Experimental":[84],"results":[85],"reveal":[86],"despite":[88],"its":[89],"lightweight":[90],"design,":[91],"consistently":[93],"improves":[94],"across":[96],"various":[97],"text-to-image":[98],"models.":[99],"Notably,":[100],"also":[102],"reduces":[103],"inference":[105],"steps":[106],"required":[107],"for":[108],"image":[109],"generation,":[110],"all":[111],"while":[112],"maintaining":[113],"high-quality":[114],"outputs.":[115]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-28T00:00:00"}
