{"id":"https://openalex.org/W4392982007","doi":"https://doi.org/10.1109/cvmi59935.2023.10464441","title":"Enhancing the Video Editing Capabilities of Text-to-Video Generators Using DDPM Inversion","display_name":"Enhancing the Video Editing Capabilities of Text-to-Video Generators Using DDPM Inversion","publication_year":2023,"publication_date":"2023-12-10","ids":{"openalex":"https://openalex.org/W4392982007","doi":"https://doi.org/10.1109/cvmi59935.2023.10464441"},"language":"en","primary_location":{"id":"doi:10.1109/cvmi59935.2023.10464441","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvmi59935.2023.10464441","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011951994","display_name":"W. Wilfred Godfrey","orcid":"https://orcid.org/0000-0002-0720-2647"},"institutions":[{"id":"https://openalex.org/I9747756","display_name":"Atal Bihari Vajpayee Indian Institute of Information Technology and Management","ror":"https://ror.org/008b3ap06","country_code":"IN","type":"education","lineage":["https://openalex.org/I9747756"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"W Wilfred Godfrey","raw_affiliation_strings":["ABV-IIITM Gwalior,Computer Science,Gwalior,India","Computer Science, ABV-IIITM Gwalior, Gwalior, India"],"affiliations":[{"raw_affiliation_string":"ABV-IIITM Gwalior,Computer Science,Gwalior,India","institution_ids":["https://openalex.org/I9747756"]},{"raw_affiliation_string":"Computer Science, ABV-IIITM Gwalior, Gwalior, India","institution_ids":["https://openalex.org/I9747756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5094198853","display_name":"Abhinav Ratna","orcid":null},"institutions":[{"id":"https://openalex.org/I9747756","display_name":"Atal Bihari Vajpayee Indian Institute of Information Technology and Management","ror":"https://ror.org/008b3ap06","country_code":"IN","type":"education","lineage":["https://openalex.org/I9747756"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Abhinav Ratna","raw_affiliation_strings":["ABV-IIITM Gwalior,Information Technology,Gwalior,India","Information Technology, ABV-IIITM Gwalior, Gwalior, India"],"affiliations":[{"raw_affiliation_string":"ABV-IIITM Gwalior,Information Technology,Gwalior,India","institution_ids":["https://openalex.org/I9747756"]},{"raw_affiliation_string":"Information Technology, ABV-IIITM Gwalior, Gwalior, India","institution_ids":["https://openalex.org/I9747756"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5011951994"],"corresponding_institution_ids":["https://openalex.org/I9747756"],"apc_list":null,"apc_paid":null,"fwci":0.2674,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57046599,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14276","display_name":"Power Systems and Technologies","score":0.7390000224113464,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14276","display_name":"Power Systems and Technologies","score":0.7390000224113464,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.6574000120162964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13734","display_name":"Advanced Computational Techniques and Applications","score":0.600600004196167,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6735889315605164},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.4109407067298889},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3460831642150879}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6735889315605164},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.4109407067298889},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3460831642150879}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvmi59935.2023.10464441","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvmi59935.2023.10464441","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2916743882","https://openalex.org/W3036167779","https://openalex.org/W3121370741","https://openalex.org/W3166396011","https://openalex.org/W3168053944","https://openalex.org/W4289785045","https://openalex.org/W4310695675","https://openalex.org/W4366551601","https://openalex.org/W4380137036","https://openalex.org/W4385527149","https://openalex.org/W4386076532","https://openalex.org/W4390678101","https://openalex.org/W4390873135","https://openalex.org/W4402753991"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"Text-to-video":[0],"generation":[1,50,96,126],"has":[2,37],"garnered":[3],"significant":[4],"attention":[5],"due":[6],"to":[7,62,122],"its":[8],"potential":[9],"applications":[10],"in":[11,43,72],"various":[12],"domains,":[13],"such":[14],"as":[15,39],"video":[16,77,131],"synthesis,":[17],"content":[18,161],"creation,":[19],"and":[20,75,152],"entertainment.":[21],"The":[22],"one-shot":[23,94],"learning":[24],"approach,":[25],"wherein":[26],"a":[27,40,55,116,129,145],"single":[28,117],"text-video":[29,118],"pair":[30,119],"is":[31,120],"utilized":[32],"for":[33],"generating":[34],"corresponding":[35],"videos,":[36],"emerged":[38],"promising":[41],"technique":[42,110],"this":[44,80],"realm.":[45],"This":[46],"approach":[47],"involves":[48],"the":[49,64,90,100,103,112,124,135,154],"of":[51,93,102,137,149],"videos":[52],"based":[53],"on":[54],"given":[56],"text":[57],"prompt,":[58],"with":[59],"subsequent":[60],"editing":[61,91,139],"refine":[63],"output.":[65,132],"However,":[66],"existing":[67,113],"methods":[68],"often":[69],"exhibit":[70],"limitations":[71],"achieving":[73],"intricate":[74],"nuanced":[76],"editing.":[78],"In":[79],"research":[81],"paper,":[82],"we":[83,141],"present":[84],"an":[85],"innovative":[86],"framework":[87],"that":[88],"enhances":[89],"capabilities":[92],"text-to-video":[95],"models.":[97],"We":[98],"propose":[99],"integration":[101],"Denoising":[104],"Diffusion":[105],"Probabilistic":[106],"Model":[107],"(DDPM)":[108],"inversion":[109],"into":[111],"pipeline.":[114],"Initially,":[115],"used":[121],"guide":[123],"initial":[125],"process,":[127],"yielding":[128],"foundational":[130],"To":[133],"address":[134],"challenge":[136],"limited":[138],"potential,":[140],"leverage":[142],"DDPM":[143],"inversion,":[144],"novel":[146],"method":[147],"capable":[148],"iteratively":[150],"refining":[151],"modifying":[153],"generated":[155],"video's":[156],"structure":[157],"while":[158],"preserving":[159],"high-level":[160],"details.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
