{"id":"https://openalex.org/W7160536446","doi":"https://doi.org/10.48550/arxiv.2605.04569","title":"LIVEditor-14B: Lightning Unified Video Editing via In-Context Sparse Attention","display_name":"LIVEditor-14B: Lightning Unified Video Editing via In-Context Sparse Attention","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160536446","doi":"https://doi.org/10.48550/arxiv.2605.04569"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04569","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073038991","display_name":"Shitong Shao","orcid":"https://orcid.org/0000-0003-4689-6140"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Shitong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135555216","display_name":"Zikai Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zikai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135627822","display_name":"Haopeng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Haopeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135607455","display_name":"Yingwei Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yingwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135552422","display_name":"Wenliang Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Wenliang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032096158","display_name":"Lichen Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Lichen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135609781","display_name":"Zeke Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Zeke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2506999969482422,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2506999969482422,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.24979999661445618,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.23070000112056732,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6802999973297119},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5848000049591064},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.49889999628067017},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.47440001368522644},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.3935999870300293},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.3345000147819519},{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.3262999951839447},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.32330000400543213}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8256999850273132},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6802999973297119},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5848000049591064},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.49889999628067017},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.3935999870300293},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39340001344680786},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3345000147819519},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.3262999951839447},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.32260000705718994},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3012000024318695},{"id":"https://openalex.org/C69398868","wikidata":"https://www.wikidata.org/wiki/Q129052","display_name":"Lightning (connector)","level":3,"score":0.29170000553131104},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C158495155","wikidata":"https://www.wikidata.org/wiki/Q2369151","display_name":"Visual search","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25609999895095825}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"editing":[1,121],"has":[2],"evolved":[3],"toward":[4],"In-Context":[5],"Learning":[6],"(ICL)":[7],"paradigms,":[8],"yet":[9],"the":[10,29],"resulting":[11],"quadratic":[12],"attention":[13,99],"costs":[14],"create":[15],"a":[16,88,104,117,126,133,143],"critical":[17],"computational":[18],"bottleneck.":[19],"In":[20],"this":[21],"work,":[22],"we":[23,59,113],"propose":[24],"In-context":[25],"Sparse":[26],"Attention":[27],"(ISA),":[28],"first":[30],"near-lossless":[31,159],"empirical":[32],"sparse":[33,110],"framework":[34],"tailored":[35],"for":[36],"ICL":[37],"video":[38,120],"editing.":[39],"Our":[40],"design":[41],"is":[42],"grounded":[43],"in":[44,146],"two":[45],"key":[46],"insights:":[47],"first,":[48],"context":[49],"tokens":[50],"exhibit":[51],"significantly":[52],"lower":[53],"saliency":[54],"than":[55],"source":[56],"tokens;":[57],"second,":[58],"theoretically":[60],"prove":[61],"and":[62,100,125,156],"empirically":[63],"validate":[64],"that":[65,93,131,140],"Query":[66],"sharpness":[67],"correlates":[68],"with":[69],"approximation":[70],"error.":[71],"Motivated":[72],"by":[73,87],"these":[74],"findings,":[75],"ISA":[76,124],"implements":[77],"an":[78],"efficient":[79,106],"pre-selection":[80],"strategy":[81],"to":[82,97,103],"prune":[83],"redundant":[84],"context,":[85],"followed":[86],"dynamic":[89],"query":[90],"grouping":[91],"mechanism":[92],"routes":[94],"high-error":[95],"queries":[96],"full":[98],"low-error":[101],"ones":[102],"computationally":[105],"0-th":[107],"order":[108],"Taylor":[109],"attention.":[111],"Furthermore,":[112],"build":[114],"\\textbf{\\texttt{LIVEditor-14B}}":[115],",":[116],"novel":[118],"lightning":[119],"model":[122],"via":[123],"proposed":[127],"video-editing":[128],"data":[129],"pipeline":[130],"curated":[132],"1.7M":[134],"high-quality":[135],"dataset.":[136],"Extensive":[137],"experiments":[138],"demonstrate":[139],"LIVEditor-14B":[141],"achieves":[142],"$\\sim$60%":[144],"reduction":[145],"attention-module":[147],"latency":[148],"while":[149],"surpassing":[150],"state-of-the-art":[151],"methods":[152],"across":[153],"EditVerseBench,":[154],"IVE-Bench,":[155],"VIE-Bench,":[157],"delivering":[158],"acceleration":[160],"without":[161],"compromising":[162],"visual":[163],"fidelity.":[164]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-08T00:00:00"}
