{"id":"https://openalex.org/W4417124644","doi":"https://doi.org/10.1145/3757377.3763904","title":"In-2-4D: Inbetweening from Two Single-View Images to 4D Generation","display_name":"In-2-4D: Inbetweening from Two Single-View Images to 4D Generation","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W4417124644","doi":"https://doi.org/10.1145/3757377.3763904"},"language":null,"primary_location":{"id":"doi:10.1145/3757377.3763904","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3757377.3763904","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3757377.3763904","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076328294","display_name":"Sauradip Nag","orcid":"https://orcid.org/0000-0002-2943-6663"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Sauradip Nag","raw_affiliation_strings":["Simon Fraser University, Burnaby, Canada"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University, Burnaby, Canada","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036688260","display_name":"Daniel Cohen\u2010Or","orcid":"https://orcid.org/0000-0001-6777-7445"},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"education","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Daniel Cohen-Or","raw_affiliation_strings":["Tel Aviv University, Tel Aviv, Israel"],"affiliations":[{"raw_affiliation_string":"Tel Aviv University, Tel Aviv, Israel","institution_ids":["https://openalex.org/I16391192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100397026","display_name":"Hao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Hao Zhang","raw_affiliation_strings":["Simon Fraser University, Burnaby, Canada"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University, Burnaby, Canada","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021862056","display_name":"Ali Mahdavi\u2010Amiri","orcid":"https://orcid.org/0000-0002-4693-3565"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ali Mahdavi Amiri","raw_affiliation_strings":["Simon Fraser University, Burnaby, Canada"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University, Burnaby, Canada","institution_ids":["https://openalex.org/I18014758"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076328294"],"corresponding_institution_ids":["https://openalex.org/I18014758"],"apc_list":null,"apc_paid":null,"fwci":1.2784,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8629554,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8191999793052673,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8191999793052673,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.043800000101327896,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.02410000003874302,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.48429998755455017},{"id":"https://openalex.org/keywords/motion-field","display_name":"Motion field","score":0.438400000333786},{"id":"https://openalex.org/keywords/motion-interpolation","display_name":"Motion interpolation","score":0.4244999885559082},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.40450000762939453},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.4027000069618225},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.3815999925136566},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.375},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.3617999851703644},{"id":"https://openalex.org/keywords/affine-transformation","display_name":"Affine transformation","score":0.3276999890804291}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7457000017166138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.738099992275238},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7067000269889832},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.48429998755455017},{"id":"https://openalex.org/C124774092","wikidata":"https://www.wikidata.org/wiki/Q6917782","display_name":"Motion field","level":3,"score":0.438400000333786},{"id":"https://openalex.org/C72560505","wikidata":"https://www.wikidata.org/wiki/Q204510","display_name":"Motion interpolation","level":5,"score":0.4244999885559082},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.40450000762939453},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.4027000069618225},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.3815999925136566},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.375},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.3276999890804291},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.32659998536109924},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.3043999969959259},{"id":"https://openalex.org/C146159030","wikidata":"https://www.wikidata.org/wiki/Q7625099","display_name":"Structure from motion","level":3,"score":0.29980000853538513},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.28279998898506165},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2797999978065491},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.27489998936653137},{"id":"https://openalex.org/C126795593","wikidata":"https://www.wikidata.org/wiki/Q7333813","display_name":"Rigid transformation","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C2776863239","wikidata":"https://www.wikidata.org/wiki/Q7936601","display_name":"Visual hull","level":3,"score":0.2574000060558319},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C95020103","wikidata":"https://www.wikidata.org/wiki/Q1813492","display_name":"Match moving","level":3,"score":0.2563999891281128},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.2535000145435333},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3757377.3763904","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3757377.3763904","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3757377.3763904","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3757377.3763904","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2294052718","https://openalex.org/W2980523614","https://openalex.org/W4310443750","https://openalex.org/W4312445951","https://openalex.org/W4385318467","https://openalex.org/W4386071957","https://openalex.org/W4386072026","https://openalex.org/W4386075660","https://openalex.org/W4386075787","https://openalex.org/W4386113240","https://openalex.org/W4390872556","https://openalex.org/W4390873135","https://openalex.org/W4390873331","https://openalex.org/W4393149921","https://openalex.org/W4399574574","https://openalex.org/W4400582082","https://openalex.org/W4402713101","https://openalex.org/W4402716105","https://openalex.org/W4402727067","https://openalex.org/W4402727359","https://openalex.org/W4402727731","https://openalex.org/W4403705810","https://openalex.org/W4412673604","https://openalex.org/W4413147835","https://openalex.org/W4415795332","https://openalex.org/W4415795691","https://openalex.org/W4415797420","https://openalex.org/W4415797429","https://openalex.org/W4415798697"],"related_works":[],"abstract_inverted_index":{"We":[0],"pose":[1],"a":[2,28,93,116,145,171,234],"new":[3],"problem,":[4],"In-2-4D,":[5],"for":[6,98],"generative":[7],"4D":[8],"(i.e.,":[9],"3D":[10,146,181,203],"+":[11],"motion)":[12],"inbetweening":[13],"to":[14,21,40,64,108,119,126,214],"interpolate":[15],"two":[16,46],"single-view":[17],"images.":[18],"In":[19],"contrast":[20],"video/4D":[22],"generation":[23],"from":[24],"only":[25],"text":[26],"or":[27,82],"single":[29],"image,":[30],"our":[31,61,242],"interpolative":[32],"task":[33],"can":[34,106],"leverage":[35],"more":[36],"precise":[37],"motion":[38,69,79,99,104,204],"control":[39],"better":[41],"constrain":[42],"the":[43,51,68,76,127,149,159,162,180,185,200,217,239],"generation.":[44],"Given":[45],"monocular":[47],"RGB":[48],"images":[49],"representing":[50],"start":[52],"and":[53,66,88,178,192,211,222,228,244],"end":[54],"states":[55,129],"of":[56,148,187,241],"an":[57],"object":[58,77],"in":[59,70],"motion,":[60,163,182],"goal":[62],"is":[63],"generate":[65,135],"reconstruct":[67],"4D,":[71],"without":[72],"making":[73],"assumptions":[74],"on":[75],"category,":[78],"type,":[80],"length,":[81],"complexity.":[83],"To":[84,111,174],"handle":[85],"such":[86],"arbitrary":[87],"diverse":[89],"motions,":[90,133],"we":[91,114,143,183,198,237],"utilize":[92],"foundational":[94],"video":[95],"interpolation":[96],"model":[97],"prediction.":[100],"However,":[101],"large":[102],"frame-to-frame":[103],"gaps":[105],"lead":[107],"ambiguous":[109],"interpretations.":[110],"this":[112],"end,":[113],"employ":[115],"hierarchical":[117],"approach":[118],"identify":[120],"keyframes":[121],"that":[122],"are":[123],"visually":[124],"close":[125],"input":[128],"while":[130],"exhibiting":[131],"significant":[132],"then":[134],"smooth":[136,221],"fragments":[137],"between":[138],"them.":[139],"For":[140],"each":[141],"fragment,":[142],"construct":[144],"representation":[147],"keyframe":[150],"using":[151],"Gaussian":[152],"Splatting":[153],"(3DGS).":[154],"The":[155],"temporal":[156,176],"frames":[157],"within":[158],"fragment":[160],"guide":[161],"enabling":[164],"their":[165],"transformation":[166,195],"into":[167],"dynamic":[168],"3DGS":[169],"through":[170],"deformation":[172,209],"field.":[173],"improve":[175],"consistency":[177],"refine":[179],"expand":[184],"self-attention":[186],"multi-view":[188],"diffusion":[189],"across":[190],"timesteps":[191],"apply":[193],"rigid":[194],"regularization.":[196],"Finally,":[197],"merge":[199],"independently":[201],"generated":[202],"segments":[205],"by":[206],"interpolating":[207],"boundary":[208],"fields":[210],"optimizing":[212],"them":[213],"align":[215],"with":[216],"guiding":[218],"video,":[219],"ensuring":[220],"flicker-free":[223],"transitions.":[224],"Through":[225],"extensive":[226],"qualitative":[227],"quantitive":[229],"experiments":[230],"as":[231,233],"well":[232],"user":[235],"study,":[236],"demonstrate":[238],"effectiveness":[240],"method":[243],"design":[245],"choices.":[246]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-08T00:00:00"}
