{"id":"https://openalex.org/W7161952949","doi":"https://doi.org/10.48550/arxiv.2605.20624","title":"Accelerating Video Inverse Problem Solvers with Autoregressive Diffusion Models","display_name":"Accelerating Video Inverse Problem Solvers with Autoregressive Diffusion Models","publication_year":2026,"publication_date":"2026-05-20","ids":{"openalex":"https://openalex.org/W7161952949","doi":"https://doi.org/10.48550/arxiv.2605.20624"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.20624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.20624","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128776589","display_name":"Taesung Kwon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kwon, Taesung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125094926","display_name":"Jonghyun Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jonghyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006604581","display_name":"Hyungjin Chung","orcid":"https://orcid.org/0000-0003-3202-0893"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chung, Hyungjin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136639478","display_name":"Jong Chul Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Jong Chul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.24330000579357147,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.24330000579357147,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.09059999883174896,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.08749999850988388,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.5625},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5594000220298767},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.5504000186920166},{"id":"https://openalex.org/keywords/inverse-problem","display_name":"Inverse problem","score":0.44670000672340393},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4122999906539917},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.41179999709129333},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.38940000534057617}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7305999994277954},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.5625},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5594000220298767},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.5504000186920166},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.46299999952316284},{"id":"https://openalex.org/C135252773","wikidata":"https://www.wikidata.org/wiki/Q1567213","display_name":"Inverse problem","level":2,"score":0.44670000672340393},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4122999906539917},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.41179999709129333},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.38940000534057617},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.34610000252723694},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.33889999985694885},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.3327000141143799},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.31470000743865967},{"id":"https://openalex.org/C2986160907","wikidata":"https://www.wikidata.org/wiki/Q220499","display_name":"Video streaming","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.289900004863739},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2793000042438507},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2743000090122223},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.20624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.20624","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20624","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"models":[1,61],"provide":[2],"powerful":[3],"priors":[4],"for":[5],"zero-shot":[6],"video":[7,25,59],"inverse":[8],"problems,":[9],"but":[10],"their":[11],"real-time":[12,161],"deployment":[13],"is":[14],"hindered":[15],"by":[16,23],"two":[17],"inefficiencies:":[18],"high":[19],"initial":[20,95],"latency":[21,71,96],"caused":[22],"holistic":[24],"restoration,":[26],"and":[27,101,151],"low":[28],"throughput":[29,103,137],"resulting":[30],"from":[31,97,104],"multiple":[32],"VAE":[33],"passes":[34],"to":[35,62,88,99,106,138],"enforce":[36],"measurement":[37,126],"consistency":[38,127],"in":[39,65],"pixel":[40],"space.":[41],"To":[42],"overcome":[43],"these":[44],"limitations,":[45],"we":[46],"propose":[47],"Autoregressive":[48],"Video":[49],"Inverse":[50],"problem":[51],"Solver":[52],"(AVIS).":[53],"The":[54],"AVIS":[55,74,92,122,133],"framework":[56],"leverages":[57],"autoregressive":[58],"diffusion":[60,77],"restore":[63],"videos":[64],"a":[66,79,117,142,153],"streaming":[67],"manner,":[68],"naturally":[69],"eliminating":[70],"bottlenecks.":[72],"Specifically,":[73],"initializes":[75],"reverse":[76],"with":[78],"measurement-consistent":[80],"estimate,":[81],"reducing":[82],"the":[83,130,158],"required":[84],"sampling":[85],"steps.":[86],"Compared":[87],"leading":[89],"non-autoregressive":[90],"solvers,":[91],"drastically":[93],"reduces":[94],"114s":[98],"4s":[100],"increases":[102],"0.71":[105],"1.18":[107],"FPS":[108,140],"while":[109,147],"achieving":[110,152],"superior":[111],"restoration":[112],"quality.":[113],"We":[114],"further":[115],"introduce":[116],"highly":[118],"accelerated":[119],"variant,":[120],"dubbed":[121],"Flash,":[123],"that":[124],"enforces":[125],"solely":[128],"on":[129,141],"first":[131],"chunk.":[132],"Flash":[134],"substantially":[135],"boosts":[136],"5.91":[139],"single":[143],"RTX":[144],"4090":[145],"GPU":[146],"maintaining":[148],"competitive":[149],"performance":[150],"favorable":[154],"efficiency-performance":[155],"trade-off,":[156],"paving":[157],"way":[159],"toward":[160],"deployment.":[162]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-22T00:00:00"}
