{"id":"https://openalex.org/W7133343244","doi":"https://doi.org/10.48550/arxiv.2603.00589","title":"AlignVAR: Towards Globally Consistent Visual Autoregression for Image Super-Resolution","display_name":"AlignVAR: Towards Globally Consistent Visual Autoregression for Image Super-Resolution","publication_year":2026,"publication_date":"2026-02-28","ids":{"openalex":"https://openalex.org/W7133343244","doi":"https://doi.org/10.48550/arxiv.2603.00589"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.00589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074172920","display_name":"Cencen Liu","orcid":"https://orcid.org/0009-0004-8162-7071"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liu, Cencen","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128026286","display_name":"Dongyang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]},{"id":"https://openalex.org/I4210102840","display_name":"Ubiquitous Energy (United States)","ror":"https://ror.org/01b06j989","country_code":"US","type":"company","lineage":["https://openalex.org/I4210102840"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Zhang, Dongyang","raw_affiliation_strings":["University of Electronic Science and Technology of China","Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province","institution_ids":["https://openalex.org/I4210102840"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071889563","display_name":"Wen Yin","orcid":"https://orcid.org/0000-0001-7447-9905"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yin, Wen","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043163390","display_name":"Jielei Wang","orcid":"https://orcid.org/0000-0003-2882-7053"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]},{"id":"https://openalex.org/I4210102840","display_name":"Ubiquitous Energy (United States)","ror":"https://ror.org/01b06j989","country_code":"US","type":"company","lineage":["https://openalex.org/I4210102840"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Wang, Jielei","raw_affiliation_strings":["University of Electronic Science and Technology of China","Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province","institution_ids":["https://openalex.org/I4210102840"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127916129","display_name":"Tianyu Li","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li, Tianyu","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017191320","display_name":"Ji Guo","orcid":"https://orcid.org/0009-0008-8990-436X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guo, Ji","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044354150","display_name":"W. L. Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiang, Wenbo","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100334012","display_name":"Guoqing Wang","orcid":"https://orcid.org/0000-0001-9326-3755"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wang, Guoqing","raw_affiliation_strings":["University of Electronic Science and Technology of China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5127967956","display_name":"Guoming Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]},{"id":"https://openalex.org/I4210102840","display_name":"Ubiquitous Energy (United States)","ror":"https://ror.org/01b06j989","country_code":"US","type":"company","lineage":["https://openalex.org/I4210102840"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Lu, Guoming","raw_affiliation_strings":["University of Electronic Science and Technology of China","Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"Ubiquitous Intelligence and Trusted Services Key Laboratory of Sichuan Province","institution_ids":["https://openalex.org/I4210102840"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.5921000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.5921000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.34360000491142273,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.008100000210106373,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.7996000051498413},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6265000104904175},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.49149999022483826},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.47600001096725464},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.42590001225471497},{"id":"https://openalex.org/keywords/vector-autoregression","display_name":"Vector autoregression","score":0.4237000048160553},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.420199990272522},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.413100004196167},{"id":"https://openalex.org/keywords/local-consistency","display_name":"Local consistency","score":0.4072999954223633}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.7996000051498413},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6265000104904175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5932999849319458},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5825999975204468},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.49149999022483826},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.47600001096725464},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.42590001225471497},{"id":"https://openalex.org/C133029050","wikidata":"https://www.wikidata.org/wiki/Q385593","display_name":"Vector autoregression","level":2,"score":0.4237000048160553},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.420199990272522},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.413100004196167},{"id":"https://openalex.org/C137105694","wikidata":"https://www.wikidata.org/wiki/Q3407510","display_name":"Local consistency","level":4,"score":0.4072999954223633},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3928999900817871},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.383899986743927},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3781999945640564},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.3675999939441681},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.36570000648498535},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.33500000834465027},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3244999945163727},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.31690001487731934},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.2953000068664551},{"id":"https://openalex.org/C137703641","wikidata":"https://www.wikidata.org/wiki/Q4874480","display_name":"Bayesian vector autoregression","level":3,"score":0.29499998688697815},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28619998693466187},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.2660999894142151},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.25099998712539673}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.00589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.00589","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00589","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.00589","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Visual":[0],"autoregressive":[1,77],"(VAR)":[2],"models":[3],"have":[4],"recently":[5],"emerged":[6],"as":[7],"a":[8,73,170],"promising":[9],"alternative":[10],"for":[11,31,80,173],"image":[12,32],"generation,":[13],"offering":[14],"stable":[15],"training,":[16],"non-iterative":[17],"inference,":[18],"and":[19,40,51,107,111,132,147],"high-fidelity":[20],"synthesis":[21],"through":[22],"next-scale":[23],"prediction.":[24],"This":[25],"encourages":[26],"the":[27,134],"exploration":[28],"of":[29,63],"VAR":[30],"super-resolution":[33],"(ISR),":[34],"yet":[35],"its":[36],"application":[37],"remains":[38],"underexplored":[39],"faces":[41],"two":[42,83],"critical":[43],"challenges:":[44],"locality-biased":[45],"attention,":[46],"which":[47,54,91,117],"fragments":[48],"spatial":[49],"structures,":[50],"residual-only":[52],"supervision,":[53],"accumulates":[55],"errors":[56],"across":[57],"scales,":[58],"severely":[59],"compromises":[60],"global":[61],"consistency":[62],"reconstructed":[64],"images.":[65],"To":[66],"address":[67],"these":[68],"issues,":[69],"we":[70],"propose":[71],"AlignVAR,":[72],"globally":[74],"consistent":[75],"visual":[76],"framework":[78],"tailored":[79],"ISR,":[81],"featuring":[82],"key":[84],"components:":[85],"(1)":[86],"Spatial":[87],"Consistency":[88,114],"Autoregression":[89],"(SCA),":[90],"applies":[92],"an":[93],"adaptive":[94],"mask":[95],"to":[96],"reweight":[97],"attention":[98],"toward":[99],"structurally":[100],"correlated":[101],"regions,":[102],"thereby":[103],"mitigating":[104],"excessive":[105],"locality":[106],"enhancing":[108],"long-range":[109],"dependencies;":[110],"(2)":[112],"Hierarchical":[113],"Constraint":[115],"(HCC),":[116],"augments":[118],"residual":[119],"learning":[120],"with":[121,160],"full":[122],"reconstruction":[123],"supervision":[124],"at":[125],"each":[126],"scale,":[127],"exposing":[128],"accumulated":[129],"deviations":[130],"early":[131],"stabilizing":[133],"coarse-to-fine":[135],"refinement":[136],"process.":[137],"Extensive":[138],"experiments":[139],"demonstrate":[140],"that":[141],"AlignVAR":[142],"consistently":[143],"enhances":[144],"structural":[145],"coherence":[146],"perceptual":[148],"fidelity":[149],"over":[150,156],"existing":[151],"generative":[152],"methods,":[153],"while":[154],"delivering":[155],"10x":[157],"faster":[158],"inference":[159],"nearly":[161],"50%":[162],"fewer":[163],"parameters":[164],"than":[165],"leading":[166],"diffusion-based":[167],"approaches,":[168],"establishing":[169],"new":[171],"paradigm":[172],"efficient":[174],"ISR.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-04T00:00:00"}
