{"id":"https://openalex.org/W2924996095","doi":"https://doi.org/10.1109/cvpr.2019.01067","title":"Video Relationship Reasoning Using Gated Spatio-Temporal Energy Graph","display_name":"Video Relationship Reasoning Using Gated Spatio-Temporal Energy Graph","publication_year":2019,"publication_date":"2019-06-01","ids":{"openalex":"https://openalex.org/W2924996095","doi":"https://doi.org/10.1109/cvpr.2019.01067","mag":"2924996095"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2019.01067","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2019.01067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1903.10547","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015826285","display_name":"Yao-Hung Hubert Tsai","orcid":"https://orcid.org/0000-0001-5312-1875"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yao-Hung Hubert Tsai","raw_affiliation_strings":["Carnegie Mellon Univ","Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon Univ","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046849436","display_name":"Santosh Divvala","orcid":"https://orcid.org/0000-0003-4042-5874"},"institutions":[{"id":"https://openalex.org/I4210140341","display_name":"Allen Institute","ror":"https://ror.org/03cpe7c52","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210140341"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Santosh Divvala","raw_affiliation_strings":["Allen Institute for AI","[Allen Institute for AI.]"],"affiliations":[{"raw_affiliation_string":"Allen Institute for AI","institution_ids":["https://openalex.org/I4210140341"]},{"raw_affiliation_string":"[Allen Institute for AI.]","institution_ids":["https://openalex.org/I4210140341"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081398601","display_name":"Louis\u2013Philippe Morency","orcid":"https://orcid.org/0000-0001-6376-7696"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Louis-Philippe Morency","raw_affiliation_strings":["Carnegie Mellon Univ","Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon Univ","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071983998","display_name":"Ruslan Salakhutdinov","orcid":"https://orcid.org/0000-0002-3752-2756"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ruslan Salakhutdinov","raw_affiliation_strings":["Carnegie Mellon Univ","Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon Univ","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101576595","display_name":"Ali Farhadi","orcid":"https://orcid.org/0000-0001-7249-2380"},"institutions":[{"id":"https://openalex.org/I4210156221","display_name":"Allen Institute for Artificial Intelligence","ror":"https://ror.org/05w520734","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156221"]},{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ali Farhadi","raw_affiliation_strings":["Univ. of Washington, Allen Institute for Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Univ. of Washington, Allen Institute for Artificial Intelligence","institution_ids":["https://openalex.org/I4210156221","https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5015826285"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.226,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.83148636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"10416","last_page":"10425"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7364185452461243},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5782572031021118},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5744500160217285},{"id":"https://openalex.org/keywords/lift","display_name":"Lift (data mining)","score":0.5463417768478394},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.5399413704872131},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.5078192353248596},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.48605018854141235},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.47479408979415894},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.45503732562065125},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.44737565517425537},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.43499070405960083},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42301246523857117},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.325130820274353}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7364185452461243},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5782572031021118},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5744500160217285},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.5463417768478394},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.5399413704872131},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.5078192353248596},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.48605018854141235},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.47479408979415894},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.45503732562065125},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.44737565517425537},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.43499070405960083},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42301246523857117},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.325130820274353},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/cvpr.2019.01067","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2019.01067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1903.10547","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1903.10547","pdf_url":"https://arxiv.org/pdf/1903.10547","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2924996095","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1903.10547","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1903.10547","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1903.10547","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1903.10547","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1903.10547","pdf_url":"https://arxiv.org/pdf/1903.10547","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1219216712","display_name":"III: Medium: Learning Multimodal Knowledge about Entities and Events","funder_award_id":"1703166","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2519087326","display_name":"NRI: Collaborative Research: Experiential Learning for Robots: From Physics to Actions to Tasks","funder_award_id":"1637479","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3550935145","display_name":null,"funder_award_id":"N000141812861","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G382805209","display_name":"AF: RI: Medium: Collaborative Research: Understanding and Improving Optimization in Deep and Recurrent Networks","funder_award_id":"1763562","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4713059963","display_name":null,"funder_award_id":"FA8750","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G574185058","display_name":null,"funder_award_id":"1722822","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6894402473","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8289405913","display_name":"SHF:Small: Collaborative Research: Understanding, Modeling, and System Support for HPC Data Reduction","funder_award_id":"1812861","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G946752494","display_name":null,"funder_award_id":"IIS1763562","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2924996095.pdf","grobid_xml":"https://content.openalex.org/works/W2924996095.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1905533542","https://openalex.org/W2049705550","https://openalex.org/W2054141820","https://openalex.org/W2097073572","https://openalex.org/W2101534792","https://openalex.org/W2105101328","https://openalex.org/W2115096495","https://openalex.org/W2117539524","https://openalex.org/W2124592697","https://openalex.org/W2161236525","https://openalex.org/W2250539671","https://openalex.org/W2479423890","https://openalex.org/W2583815496","https://openalex.org/W2591644541","https://openalex.org/W2607855566","https://openalex.org/W2608988379","https://openalex.org/W2625366777","https://openalex.org/W2765137706","https://openalex.org/W2788537604","https://openalex.org/W2806331055","https://openalex.org/W2883170015","https://openalex.org/W2889811054","https://openalex.org/W2919115771","https://openalex.org/W2963091558","https://openalex.org/W2963165299","https://openalex.org/W2963403868","https://openalex.org/W2963524571","https://openalex.org/W2963536419","https://openalex.org/W2963650529","https://openalex.org/W6631782140","https://openalex.org/W6637967152","https://openalex.org/W6649598916","https://openalex.org/W6674723063","https://openalex.org/W6674793120","https://openalex.org/W6675533928","https://openalex.org/W6680642335","https://openalex.org/W6684853950","https://openalex.org/W6703281212","https://openalex.org/W6721769334","https://openalex.org/W6739901393","https://openalex.org/W6746036303","https://openalex.org/W6746798562","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2982515679","https://openalex.org/W2981895973","https://openalex.org/W2765137706","https://openalex.org/W3203247536","https://openalex.org/W2970603704","https://openalex.org/W3035503132","https://openalex.org/W2981385984","https://openalex.org/W2951323451","https://openalex.org/W1861492603","https://openalex.org/W3207158043","https://openalex.org/W2770804203","https://openalex.org/W2803258434","https://openalex.org/W3094619608","https://openalex.org/W3002007234","https://openalex.org/W2894669491","https://openalex.org/W2798827082","https://openalex.org/W3118473641","https://openalex.org/W3128159636","https://openalex.org/W2926309785","https://openalex.org/W3136412255"],"abstract_inverted_index":{"Visual":[0],"relationship":[1,19,189],"reasoning":[2,190],"is":[3,158,166],"a":[4,18,24,71,119,124,141],"crucial":[5],"yet":[6],"challenging":[7],"task":[8],"for":[9],"understanding":[10,49],"rich":[11],"interactions":[12],"across":[13,186],"visual":[14,50,76,153],"concepts.":[15],"For":[16],"example,":[17],"{man,":[20,31,86,91],"open,":[21],"door}":[22],"involves":[23],"complex":[25],"relation":[26],"{open}":[27],"between":[28,133],"concrete":[29],"entities":[30,135],"door}.":[32],"While":[33],"much":[34],"of":[35,46,75],"the":[36,44,130],"existing":[37],"work":[38],"has":[39,54],"studied":[40],"this":[41,115],"problem":[42],"in":[43,52],"context":[45],"still":[47],"images,":[48],"relationships":[51,98],"videos":[53,63],"received":[55],"limited":[56],"attention.":[57],"Due":[58],"to":[59,66],"their":[60],"temporal":[61],"nature,":[62],"enable":[64],"us":[65],"model":[67,156],"and":[68,137,161,181,194],"reason":[69],"about":[70],"more":[72],"comprehensive":[73],"set":[74],"relationships,":[77],"such":[78],"as":[79,95,97],"those":[80],"requiring":[81],"multiple":[82],"(temporal)":[83],"observations":[84],"(e.g.,":[85,105],"lift":[87],"up,":[88],"box}":[89],"vs.":[90],"put":[92],"down,":[93],"box}),":[94],"well":[96],"that":[99,128,147],"are":[100],"often":[101],"correlated":[102],"through":[103,169],"time":[104],"{woman,":[106,111],"pay,":[107],"money}":[108],"followed":[109],"by":[110],"buy,":[112],"coffee}).":[113],"In":[114],"paper,":[116],"we":[117],"construct":[118],"Conditional":[120],"Random":[121],"Field":[122],"on":[123,152,175],"fully-connected":[125],"spatiotemporal":[126],"graph":[127],"exploits":[129],"statistical":[131],"dependency":[132],"relational":[134],"spatially":[136],"temporally.":[138],"We":[139],"introduce":[140],"novel":[142],"gated":[143],"energy":[144],"function":[145],"parametrization":[146],"learns":[148],"adaptive":[149],"relations":[150],"conditioned":[151],"observations.":[154],"Our":[155],"optimization":[157],"computationally":[159],"efficient,":[160],"its":[162],"space":[163],"computation":[164],"complexity":[165],"significantly":[167],"amortized":[168],"our":[170],"proposed":[171],"parameterization.":[172],"Experimental":[173],"results":[174],"benchmark":[176],"video":[177],"datasets":[178],"(ImageNet":[179],"Video":[180],"Charades)":[182],"demonstrate":[183],"state-of-the-art":[184],"performance":[185],"three":[187],"standard":[188],"tasks:":[191],"Detection,":[192],"Tagging,":[193],"Recognition.":[195]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
