{"id":"https://openalex.org/W7108228537","doi":"https://doi.org/10.48550/arxiv.2511.22991","title":"Guiding Visual Autoregressive Models through Spectrum Weakening","display_name":"Guiding Visual Autoregressive Models through Spectrum Weakening","publication_year":2025,"publication_date":"2025-11-28","ids":{"openalex":"https://openalex.org/W7108228537","doi":"https://doi.org/10.48550/arxiv.2511.22991"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2511.22991","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.22991","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2511.22991","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wang, Chaoyang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Chaoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yang, Tianmeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Tianmeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wang, Jingdong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jingdong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Tong, Yunhai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tong, Yunhai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3212999999523163,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3212999999523163,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.2093999981880188,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.0348999984562397,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.684499979019165},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.6080999970436096},{"id":"https://openalex.org/keywords/spectrum","display_name":"Spectrum (functional analysis)","score":0.5756999850273132},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.5705999732017517},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.49309998750686646},{"id":"https://openalex.org/keywords/invertible-matrix","display_name":"Invertible matrix","score":0.4357999861240387},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4099000096321106}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.684499979019165},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.6080999970436096},{"id":"https://openalex.org/C156778621","wikidata":"https://www.wikidata.org/wiki/Q1365748","display_name":"Spectrum (functional analysis)","level":2,"score":0.5756999850273132},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.5705999732017517},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.49309998750686646},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4652000069618225},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4498000144958496},{"id":"https://openalex.org/C96442724","wikidata":"https://www.wikidata.org/wiki/Q242188","display_name":"Invertible matrix","level":2,"score":0.4357999861240387},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4284000098705292},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4099000096321106},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.40939998626708984},{"id":"https://openalex.org/C164380108","wikidata":"https://www.wikidata.org/wiki/Q507187","display_name":"Attractor","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3991999924182892},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.31130000948905945},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2937999963760376},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2912999987602234},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.2718000113964081}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2511.22991","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.22991","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2511.22991","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.22991","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Classifier-free":[0],"guidance":[1,23],"(CFG)":[2],"has":[3],"become":[4],"a":[5,45,72,93],"widely":[6],"adopted":[7],"and":[8,15,147],"practical":[9],"approach":[10],"for":[11,25,48,59,171],"enhancing":[12],"generation":[13,165],"quality":[14],"improving":[16],"condition":[17],"alignment.":[18],"Recent":[19],"studies":[20],"have":[21],"explored":[22],"mechanisms":[24],"unconditional":[26,164],"generation,":[27],"yet":[28],"these":[29],"approaches":[30],"remain":[31],"fundamentally":[32],"tied":[33],"to":[34,37],"assumptions":[35],"specific":[36,61],"diffusion":[38,123],"models.":[39,52,124],"In":[40],"this":[41,69,103],"work,":[42],"we":[43,105],"propose":[44],"spectrum-weakening":[46],"framework":[47],"visual":[49],"autoregressive":[50],"(AR)":[51],"This":[53],"method":[54,161],"works":[55],"without":[56],"the":[57,77,110,118,137],"need":[58],"re-training,":[60],"conditions,":[62],"or":[63,153],"any":[64],"architectural":[65],"modifications.":[66],"It":[67],"achieves":[68],"by":[70,122],"constructing":[71],"controllable":[73],"weak":[74],"model":[75],"in":[76],"spectral":[78,85],"domain.":[79],"We":[80,125],"theoretically":[81],"show":[82],"that":[83,132,159],"invertible":[84],"transformations":[86],"preserve":[87],"information,":[88],"while":[89,166],"selectively":[90],"retaining":[91],"only":[92],"subset":[94],"of":[95,113],"spectrum":[96,107,129],"introduces":[97],"controlled":[98],"information":[99],"reduction.":[100],"Based":[101],"on":[102,144],"insight,":[104],"perform":[106],"selection":[108],"along":[109],"channel":[111],"dimension":[112],"internal":[114],"representations,":[115],"which":[116],"avoids":[117],"structural":[119],"constraints":[120],"imposed":[121],"further":[126],"introduce":[127],"two":[128],"renormalization":[130],"strategies":[131],"ensures":[133],"numerical":[134],"stability":[135],"during":[136],"weakening":[138],"process.":[139],"Extensive":[140],"experiments":[141],"were":[142],"conducted":[143],"both":[145],"discrete":[146],"continuous":[148],"AR":[149],"models,":[150],"with":[151],"text":[152],"class":[154],"conditioning.":[155],"The":[156],"results":[157],"demonstrate":[158],"our":[160],"enables":[162],"high-quality":[163],"maintaining":[167],"strong":[168],"prompt":[169],"alignment":[170],"conditional":[172],"generation.":[173]},"counts_by_year":[],"updated_date":"2025-12-03T00:07:38.036990","created_date":"2025-12-03T00:00:00"}
