{"id":"https://openalex.org/W7127684467","doi":"https://doi.org/10.48550/arxiv.2602.03753","title":"Test-Time Conditioning with Representation-Aligned Visual Features","display_name":"Test-Time Conditioning with Representation-Aligned Visual Features","publication_year":2026,"publication_date":"2026-02-03","ids":{"openalex":"https://openalex.org/W7127684467","doi":"https://doi.org/10.48550/arxiv.2602.03753"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.03753","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114424071","display_name":"Nicolas Sereyjol-Garros","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sereyjol-Garros, Nicolas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065239235","display_name":"Ellington Kirby","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kirby, Ellington","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093192294","display_name":"Victor Letzelter","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Letzelter, Victor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125028051","display_name":"Victor Besnier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Besnier, Victor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5070720681","display_name":"Nermin Samet","orcid":"https://orcid.org/0000-0001-9247-2504"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Samet, Nermin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5114424071"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7767000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7767000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.08699999749660492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11304","display_name":"Advanced Neuroimaging Techniques and Applications","score":0.02410000003874302,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6626999974250793},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6237999796867371},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5720000267028809},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5652999877929688},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5457000136375427},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4999000132083893},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4925000071525574},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.41359999775886536},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4023999869823456}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7297000288963318},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7077000141143799},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6626999974250793},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6237999796867371},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5720000267028809},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5652999877929688},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5457000136375427},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4999000132083893},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4925000071525574},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.41359999775886536},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4023999869823456},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.3968000113964081},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.38269999623298645},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3571999967098236},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35659998655319214},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.3564000129699707},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.35179999470710754},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3456999957561493},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3393999934196472},{"id":"https://openalex.org/C45262634","wikidata":"https://www.wikidata.org/wiki/Q5159291","display_name":"Conditioning","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.2770000100135803},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.26750001311302185}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.03753","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.03753","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.03753","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.03753","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"representation":[1,64],"alignment":[2],"with":[3,35],"self-supervised":[4],"models":[5],"has":[6],"been":[7],"shown":[8],"to":[9,39,87,100,123],"improve":[10],"diffusion":[11],"model":[12],"training,":[13],"its":[14],"potential":[15],"for":[16,104],"enhancing":[17],"inference-time":[18],"conditioning":[19,42],"remains":[20],"largely":[21],"unexplored.":[22],"We":[23,96,132],"introduce":[24],"Representation-Aligned":[25],"Guidance":[26],"(REPA-G),":[27],"a":[28,49,62,67,118],"framework":[29],"that":[30,152],"leverages":[31],"these":[32],"aligned":[33],"representations,":[34],"rich":[36],"semantic":[37,89],"properties,":[38],"enable":[40],"test-time":[41],"from":[43,66,80,140],"features":[44],"in":[45],"generation.":[46],"By":[47],"optimizing":[48],"similarity":[50],"objective":[51],"(the":[52],"potential)":[53],"at":[54,76,114,162],"inference,":[55],"we":[56],"steer":[57],"the":[58,105,141],"denoising":[59],"process":[60],"toward":[61],"conditioned":[63],"extracted":[65],"pre-trained":[68],"feature":[69,94],"extractor.":[70],"Our":[71],"method":[72],"provides":[73],"versatile":[74],"control":[75],"multiple":[77],"scales,":[78],"ranging":[79],"fine-grained":[81],"texture":[82],"matching":[83],"via":[84],"single":[85],"patches":[86],"broad":[88],"guidance":[90,137],"using":[91],"global":[92],"image":[93],"tokens.":[95],"further":[97],"extend":[98],"this":[99,136],"multi-concept":[101],"composition,":[102],"allowing":[103],"faithful":[106],"combination":[107],"of":[108],"distinct":[109],"concepts.":[110],"REPA-G":[111],"operates":[112],"entirely":[113],"inference":[115],"time,":[116],"offering":[117],"flexible":[119],"and":[120,149],"precise":[121],"alternative":[122],"often":[124],"ambiguous":[125],"text":[126],"prompts":[127],"or":[128],"coarse":[129],"class":[130],"labels.":[131],"theoretically":[133],"justify":[134],"how":[135],"enables":[138],"sampling":[139],"potential-induced":[142],"tilted":[143],"distribution.":[144],"Quantitative":[145],"results":[146],"on":[147],"ImageNet":[148],"COCO":[150],"demonstrate":[151],"our":[153],"approach":[154],"achieves":[155],"high-quality,":[156],"diverse":[157],"generations.":[158],"Code":[159],"is":[160],"available":[161],"https://github.com/valeoai/REPA-G.":[163]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-06T00:00:00"}
