{"id":"https://openalex.org/W2981385984","doi":"https://doi.org/10.1145/3343031.3351058","title":"Video Relation Detection with Spatio-Temporal Graph","display_name":"Video Relation Detection with Spatio-Temporal Graph","publication_year":2019,"publication_date":"2019-10-15","ids":{"openalex":"https://openalex.org/W2981385984","doi":"https://doi.org/10.1145/3343031.3351058","mag":"2981385984"},"language":"en","primary_location":{"id":"doi:10.1145/3343031.3351058","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351058","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082237060","display_name":"Xufeng Qian","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xufeng Qian","raw_affiliation_strings":["Zhejiang University, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Zhejiang Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008666077","display_name":"Yueting Zhuang","orcid":"https://orcid.org/0000-0001-9017-2508"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueting Zhuang","raw_affiliation_strings":["Zhejiang University, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Zhejiang Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100696471","display_name":"Yimeng Li","orcid":"https://orcid.org/0000-0002-5658-3706"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimeng Li","raw_affiliation_strings":["Zhejiang University, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Zhejiang Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112867700","display_name":"Shaoning Xiao","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaoning Xiao","raw_affiliation_strings":["Zhejiang University, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Zhejiang Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085955762","display_name":"Shiliang Pu","orcid":"https://orcid.org/0000-0001-5269-7821"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shiliang Pu","raw_affiliation_strings":["Hikvision Research Institute, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Hikvision Research Institute, Zhejiang Hangzhou, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101485989","display_name":"Jun Xiao","orcid":"https://orcid.org/0000-0002-6142-9914"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Xiao","raw_affiliation_strings":["Zhejiang University, Zhejiang Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, Zhejiang Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5082237060"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":4.6562,"has_fulltext":false,"cited_by_count":79,"citation_normalized_percentile":{"value":0.95960322,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"84","last_page":"93"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8410350680351257},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.5911862850189209},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5763400793075562},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5376464128494263},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5171788930892944},{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.5033645033836365},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.48752281069755554},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4460747539997101},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4421963393688202},{"id":"https://openalex.org/keywords/association","display_name":"Association (psychology)","score":0.4177358150482178},{"id":"https://openalex.org/keywords/predicate","display_name":"Predicate (mathematical logic)","score":0.41551920771598816},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38780784606933594},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35800251364707947},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3263102173805237},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3031849265098572},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.16107818484306335}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8410350680351257},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.5911862850189209},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5763400793075562},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5376464128494263},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5171788930892944},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.5033645033836365},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.48752281069755554},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4460747539997101},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4421963393688202},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.4177358150482178},{"id":"https://openalex.org/C140146324","wikidata":"https://www.wikidata.org/wiki/Q1144319","display_name":"Predicate (mathematical logic)","level":2,"score":0.41551920771598816},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38780784606933594},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35800251364707947},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3263102173805237},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3031849265098572},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.16107818484306335},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3343031.3351058","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351058","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1964846093","https://openalex.org/W2049705550","https://openalex.org/W2117539524","https://openalex.org/W2252355370","https://openalex.org/W2579549467","https://openalex.org/W2603203130","https://openalex.org/W2765137706","https://openalex.org/W2807021761","https://openalex.org/W2889418103","https://openalex.org/W2963791934","https://openalex.org/W2963854930","https://openalex.org/W2987123286","https://openalex.org/W3100848837","https://openalex.org/W3104218139"],"related_works":["https://openalex.org/W3125011624","https://openalex.org/W1508631387","https://openalex.org/W2370917603","https://openalex.org/W2017776670","https://openalex.org/W2952760143","https://openalex.org/W2347897961","https://openalex.org/W2979236518","https://openalex.org/W2358318464","https://openalex.org/W2340870721","https://openalex.org/W3091955004"],"abstract_inverted_index":{"What":[0],"we":[1,75],"perceive":[2],"from":[3,36],"visual":[4,33],"content":[5],"are":[6,50],"not":[7],"only":[8],"collections":[9],"of":[10,30,41,106,187],"objects":[11,115],"but":[12],"the":[13,21,42,61,144,155,159,178],"interactions":[14],"between":[15],"them.":[16],"Visual":[17],"relations,":[18],"denoted":[19],"by":[20,180],"triplet":[22],"<subject,":[23],"predicate,":[24],"object>,":[25],"could":[26],"convey":[27],"a":[28,66,93,128,181,185],"wealth":[29],"information":[31],"for":[32,133,150],"understanding.":[34],"Different":[35],"static":[37],"images":[38],"and":[39,56,69,85,143,184],"because":[40],"additional":[43],"temporal":[44,57],"channel,":[45],"dynamic":[46,120],"relations":[47],"in":[48,53,64,88,158],"videos":[49,65,77],"often":[51],"correlated":[52],"both":[54],"spatial":[55],"dimensions,":[58],"which":[59],"make":[60,111],"relation":[62,135,152],"detection":[63,153],"more":[67],"complex":[68],"challenging":[70],"task.":[71],"In":[72],"this":[73],"paper,":[74],"abstract":[76],"into":[78],"fully-connected":[79],"spatial-temporal":[80,107],"graphs.":[81],"We":[82,162],"pass":[83],"message":[84],"conduct":[86],"reasoning":[87],"these":[89],"3D":[90],"graphs":[91],"with":[92,127],"novel":[94],"VidVRD":[95],"model":[96,102,141],"using":[97],"graph":[98],"convolution":[99],"network.":[100],"Our":[101],"can":[103],"take":[104],"advantage":[105],"contextual":[108],"cues":[109],"to":[110],"better":[112],"predictions":[113],"on":[114,166],"as":[116,118],"well":[117],"their":[119],"relationships.":[121],"Furthermore,":[122],"an":[123],"online":[124],"association":[125,146],"method":[126],"siamese":[129],"network":[130],"is":[131],"proposed":[132,145],"accurate":[134],"instances":[136],"association.":[137],"By":[138],"combining":[139],"our":[140,148,164,175,191],"(VRD-GCN)":[142],"method,":[147],"framework":[149,176],"video":[151],"achieves":[154],"best":[156],"performance":[157],"latest":[160],"benchmarks.":[161],"validate":[163],"approach":[165],"benchmark":[167],"ImageNet-VidVRD":[168],"dataset.":[169],"The":[170],"experimental":[171],"results":[172],"show":[173],"that":[174],"outperforms":[177],"state-of-the-art":[179],"large":[182],"margin":[183],"series":[186],"ablation":[188],"studies":[189],"demonstrate":[190],"method's":[192],"effectiveness.":[193]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":21},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
