{"id":"https://openalex.org/W7161719389","doi":"https://doi.org/10.48550/arxiv.2605.17543","title":"HL-OutPaint: Coarse-to-Fine Video Outpainting for High-Resolution Long-Range Videos","display_name":"HL-OutPaint: Coarse-to-Fine Video Outpainting for High-Resolution Long-Range Videos","publication_year":2026,"publication_date":"2026-05-17","ids":{"openalex":"https://openalex.org/W7161719389","doi":"https://doi.org/10.48550/arxiv.2605.17543"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17543","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136470348","display_name":"Jeongeun Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jeongeun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136457173","display_name":"Janghyeok Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Janghyeok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002189569","display_name":"Geonung Kim","orcid":"https://orcid.org/0000-0003-0806-6963"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Geonung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136463807","display_name":"Hyun-Seung Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Hyun-Seung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006605032","display_name":"Kyuha Choi","orcid":"https://orcid.org/0000-0002-4271-6862"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Kyuha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028703681","display_name":"Youngseok Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Youngseok","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136473093","display_name":"Sunghyun Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Sunghyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.975600004196167,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.975600004196167,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.0026000000070780516,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.002099999925121665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/extrapolation","display_name":"Extrapolation","score":0.595300018787384},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5422999858856201},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5267000198364258},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5192999839782715},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5188000202178955},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5169000029563904},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4756999909877777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8083999752998352},{"id":"https://openalex.org/C132459708","wikidata":"https://www.wikidata.org/wiki/Q744069","display_name":"Extrapolation","level":2,"score":0.595300018787384},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5422999858856201},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5267000198364258},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5192999839782715},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5188000202178955},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5169000029563904},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4771000146865845},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4756999909877777},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4235999882221222},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36719998717308044},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.3582000136375427},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.30979999899864197},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.28380000591278076}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"outpainting":[1,71,158],"generates":[2],"plausible":[3],"visual":[4],"content":[5],"beyond":[6],"the":[7,104],"original":[8],"spatial":[9,34,183,202],"extent":[10],"of":[11,46],"a":[12,15,68,79,83,93,113,147],"video,":[13],"playing":[14],"key":[16],"role":[17],"in":[18,146,197],"adapting":[19],"videos":[20],"to":[21,59,136,159],"diverse":[22],"display":[23],"formats.":[24],"To":[25],"support":[26],"such":[27],"use":[28],"cases,":[29],"it":[30],"must":[31],"enable":[32],"large":[33,182],"extrapolation":[35,203],"over":[36],"long":[37,74,186,205],"sequences.":[38,75,188,207],"However,":[39],"most":[40],"existing":[41,195],"methods":[42,196],"address":[43],"only":[44],"one":[45],"these":[47],"challenges":[48],"or":[49],"lack":[50],"explicit":[51],"mechanisms":[52],"for":[53,73,181],"ensuring":[54],"global":[55,98,122,169],"spatio-temporal":[56],"consistency,":[57],"leading":[58],"notable":[60],"limitations.":[61],"In":[62],"this":[63,152],"paper,":[64],"we":[65],"propose":[66],"HL-OutPaint,":[67],"high-resolution":[69,157],"video":[70,187,206],"framework":[72,176],"Our":[76],"approach":[77],"follows":[78],"coarse-to-fine":[80],"strategy":[81],"with":[82,124],"two-stage":[84],"pipeline.":[85],"We":[86],"first":[87],"construct":[88],"Global":[89],"Coarse":[90],"Guidance":[91],"(GCG),":[92],"low-resolution":[94],"representation":[95],"that":[96,119,192],"captures":[97],"structure":[99,170],"and":[100,128,142,163,185,204],"dominant":[101],"motion":[102],"across":[103],"video.":[105],"Unlike":[106],"naive":[107],"downsampling,":[108],"GCG":[109,135],"is":[110],"built":[111],"via":[112],"novel":[114],"global-local":[115],"frame":[116],"swapping":[117],"mechanism":[118],"couples":[120],"sparse":[121],"keyframes":[123],"local":[125],"temporal":[126,144],"windows":[127],"exchanges":[129],"information":[130],"during":[131],"sampling.":[132],"This":[133],"enables":[134],"encode":[137],"both":[138],"long-term":[139],"structural":[140],"consistency":[141],"short-term":[143],"dynamics":[145],"unified":[148],"representation.":[149],"Guided":[150],"by":[151],"representation,":[153],"HL-OutPaint":[154,193],"then":[155],"performs":[156],"generate":[160],"spatially":[161],"detailed":[162],"temporally":[164],"consistent":[165],"content.":[166],"By":[167],"separating":[168],"modeling":[171],"from":[172],"fine-grained":[173],"synthesis,":[174],"our":[175],"achieves":[177],"stable,":[178],"coherent":[179],"generation":[180],"expansion":[184],"Extensive":[189],"experiments":[190],"show":[191],"outperforms":[194],"challenging":[198],"scenarios":[199],"involving":[200],"wide":[201]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
