{"id":"https://openalex.org/W4413156276","doi":"https://doi.org/10.1109/cvpr52734.2025.02715","title":"DiffVsgg: Diffusion-Driven Online Video Scene Graph Generation","display_name":"DiffVsgg: Diffusion-Driven Online Video Scene Graph Generation","publication_year":2025,"publication_date":"2025-06-10","ids":{"openalex":"https://openalex.org/W4413156276","doi":"https://doi.org/10.1109/cvpr52734.2025.02715"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52734.2025.02715","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.02715","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103246723","display_name":"Mu Chen","orcid":"https://orcid.org/0009-0003-8283-3486"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mu Chen","raw_affiliation_strings":["Zhejiang University,ReLER, CCAI"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,ReLER, CCAI","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014945486","display_name":"Liulei Li","orcid":"https://orcid.org/0000-0002-4637-0328"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology 
Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Liulei Li","raw_affiliation_strings":["University of Technology Sydney,ReLER, AAII"],"affiliations":[{"raw_affiliation_string":"University of Technology Sydney,ReLER, AAII","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101433884","display_name":"Wenguan Wang","orcid":"https://orcid.org/0000-0002-0802-9567"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenguan Wang","raw_affiliation_strings":["Zhejiang University,ReLER, CCAI"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,ReLER, CCAI","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100381753","display_name":"Shuicheng Yan","orcid":"https://orcid.org/0000-0001-8906-3777"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["Zhejiang University,ReLER, CCAI"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,ReLER, 
CCAI","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5103246723"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.319,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.84256517,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"29161","last_page":"29172"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval 
Techniques","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7262297868728638},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.49428296089172363},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47441667318344116},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.4458162784576416}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7262297868728638},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49428296089172363},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47441667318344116},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.4458162784576416}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52734.2025.02715","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.02715","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition 
(CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320338464","display_name":"Natural Science Foundation of Zhejiang Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":91,"referenced_works":["https://openalex.org/W2139501017","https://openalex.org/W2142900973","https://openalex.org/W2337252826","https://openalex.org/W2479423890","https://openalex.org/W2579549467","https://openalex.org/W2605736949","https://openalex.org/W2607855566","https://openalex.org/W2763058042","https://openalex.org/W2883170015","https://openalex.org/W2886970679","https://openalex.org/W2888096830","https://openalex.org/W2950096400","https://openalex.org/W2954199749","https://openalex.org/W2962737704","https://openalex.org/W2962749380","https://openalex.org/W2962785943","https://openalex.org/W2963150697","https://openalex.org/W2963514444","https://openalex.org/W2963536419","https://openalex.org/W2963541336","https://openalex.org/W2963649796","https://openalex.org/W2963890755","https://openalex.org/W2963902384","https://openalex.org/W2963938081","https://openalex.org/W2964089981","https://openalex.org/W2964092725","https://openalex.org/W2981385984","https://openalex.org/W2981851019","https://openalex.org/W2982515679","https://openalex.org/W2986953233","https://openalex.org/W2992049873","https://openalex.org/W3034538190","https://openalex.org/W3034679267","https://openalex.org/W3035017890","https://openalex.org/W3035218869","https://openalex.org/W3035440494","https://openalex.org/W3081642947","https://openalex.org/W3104862079","https://openalex.org/W3
119381934","https://openalex.org/W3127094814","https://openalex.org/W3174865181","https://openalex.org/W3175528717","https://openalex.org/W3186187670","https://openalex.org/W3186621246","https://openalex.org/W3193902142","https://openalex.org/W3195421894","https://openalex.org/W3201861986","https://openalex.org/W3205051885","https://openalex.org/W4214612132","https://openalex.org/W4214693531","https://openalex.org/W4214942454","https://openalex.org/W4225868495","https://openalex.org/W4292829030","https://openalex.org/W4304080820","https://openalex.org/W4312561757","https://openalex.org/W4312563197","https://openalex.org/W4312587667","https://openalex.org/W4312682661","https://openalex.org/W4312757006","https://openalex.org/W4312933868","https://openalex.org/W4313007081","https://openalex.org/W4319300235","https://openalex.org/W4366352717","https://openalex.org/W4383097625","https://openalex.org/W4386072171","https://openalex.org/W4386075801","https://openalex.org/W4386075828","https://openalex.org/W4386075963","https://openalex.org/W4388191728","https://openalex.org/W4390872705","https://openalex.org/W4390873119","https://openalex.org/W4390873429","https://openalex.org/W4390873752","https://openalex.org/W4390874160","https://openalex.org/W4391468387","https://openalex.org/W4393149283","https://openalex.org/W4394698791","https://openalex.org/W4395447445","https://openalex.org/W4400856224","https://openalex.org/W4402618831","https://openalex.org/W4402727002","https://openalex.org/W4402753518","https://openalex.org/W4402753781","https://openalex.org/W4402754144","https://openalex.org/W4402944023","https://openalex.org/W4402961670","https://openalex.org/W4402961719","https://openalex.org/W4403791750","https://openalex.org/W4403947105","https://openalex.org/W4407151317","https://openalex.org/W4413147097"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://op
enalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Top-leading":[0],"solutions":[1],"for":[2,145,160,180],"Video":[3],"Scene":[4],"Graph":[5],"Generation":[6],"(VSGG)":[7],"typically":[8],"adopt":[9],"an":[10,51,60,104],"offline":[11],"pipeline.":[12],"Though":[13],"demonstrating":[14],"promising":[15],"performance,":[16],"they":[17],"remain":[18],"unable":[19],"to":[20,123,142,174],"handle":[21],"real-time":[22],"video":[23],"streams":[24],"and":[25,92],"consume":[26],"large":[27],"GPU":[28],"memory.":[29],"Moreover,":[30],"these":[31],"approaches":[32],"fall":[33],"short":[34],"in":[35],"temporal":[36,44,156],"reasoning,":[37,157],"merely":[38],"aggregating":[39],"frame-level":[40],"predictions":[41,159],"over":[42],"a":[43,78,114,125],"context.":[45],"In":[46],"response,":[47],"we":[48,82,112],"introduce":[49],"DiffVsgg,":[50],"online":[52],"VSGG":[53],"solution":[54],"that":[55],"frames":[56,162,167],"this":[57],"task":[58],"as":[59,122,139,168],"iterative":[61],"scene":[62,148],"graph":[63,93,149],"update":[64],"problem.":[65],"Drawing":[66],"inspiration":[67],"from":[68],"Latent":[69],"Diffusion":[70],"Models":[71],"(LDMs)":[72],"which":[73,128],"generate":[74],"images":[75],"via":[76],"denoising":[77],"latent":[79],"feature":[80,100],"embedding,":[81],"unify":[83],"the":[84,131,140,169,176,192],"decoding":[85],"of":[86,109,165,172,188,194],"object":[87,110,146],"classification,":[88,147],"bounding":[89],"box":[90],"regression,":[91],"generation":[94],"three":[95,186],"tasks":[96],"using":[97],"one":[98],"shared":[99],"embedding.":[101],"Then,":[102],"given":[103],"embedding":[105,127,136],"containing":[106],"unified":[107],"features":[108],"pairs,":[111],"conduct":[113],"step-wise":[115],"Denoising":[116],"on":[117,185],"it":[118],"within":[119],"LDMs,":[120,173],"so":[121],"deliver":[
124],"clean":[126],"clearly":[129],"indicates":[130],"relationships":[132],"between":[133],"objects.":[134],"This":[135],"then":[137],"serves":[138],"input":[141],"task-specific":[143],"heads":[144],"generation,":[150],"etc.":[151],"DiffVsgg":[152],"further":[153],"facilitates":[154],"continuous":[155],"where":[158],"subsequent":[161],"leverage":[163],"results":[164],"past":[166],"conditional":[170],"inputs":[171],"guide":[175],"reverse":[177],"diffusion":[178],"process":[179],"current":[181],"frames.":[182],"Extensive":[183],"experiments":[184],"setups":[187],"Action":[189],"Genome":[190],"demonstrate":[191],"superiority":[193],"DiffVsgg.":[195]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
