{"id":"https://openalex.org/W2951143549","doi":"https://doi.org/10.1109/tcsvt.2019.2923712","title":"Spatial\u2013Temporal Context-Aware Online Action Detection and Prediction","display_name":"Spatial\u2013Temporal Context-Aware Online Action Detection and Prediction","publication_year":2019,"publication_date":"2019-06-19","ids":{"openalex":"https://openalex.org/W2951143549","doi":"https://doi.org/10.1109/tcsvt.2019.2923712","mag":"2951143549"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2019.2923712","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2019.2923712","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017136081","display_name":"Jingjia Huang","orcid":"https://orcid.org/0000-0002-0834-3265"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjia Huang","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-0834-3265","affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100419527","display_name":"Nannan Li","orcid":"https://orcid.org/0000-0002-8274-5123"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nannan Li","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-8274-5123","affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101509081","display_name":"Thomas Li","orcid":"https://orcid.org/0000-0001-9950-4679"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Thomas Li","raw_affiliation_strings":["AIIT, Peking University, Hangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIIT, Peking University, Hangzhou, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100449791","display_name":"Shan Liu","orcid":"https://orcid.org/0000-0002-1442-1207"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shan Liu","raw_affiliation_strings":["Tencent Media Lab, Palo Alto, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Media Lab, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I70745867"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100447691","display_name":"Ge Li","orcid":"https://orcid.org/0000-0003-0140-0949"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Li","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-0140-0949","affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University Shenzhen Graduate School, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3219,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.84477302,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"30","issue":"8","first_page":"2650","last_page":"2662"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.9260014295578003},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8459728956222534},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6548815965652466},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6285102963447571},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6132758855819702},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5868854522705078},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5220910310745239},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.5183021426200867},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.4733189046382904},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.46254631876945496},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44335824251174927},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.428086519241333},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.42359843850135803},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4210949242115021},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37617161870002747},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.13038960099220276}],"concepts":[{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.9260014295578003},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8459728956222534},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6548815965652466},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6285102963447571},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6132758855819702},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5868854522705078},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5220910310745239},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.5183021426200867},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.4733189046382904},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.46254631876945496},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44335824251174927},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.428086519241333},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.42359843850135803},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4210949242115021},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37617161870002747},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.13038960099220276},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2019.2923712","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2019.2923712","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.550000011920929,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G3841787934","display_name":null,"funder_award_id":"61602014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W589665618","https://openalex.org/W639708223","https://openalex.org/W753012316","https://openalex.org/W1522734439","https://openalex.org/W1559046793","https://openalex.org/W1686810756","https://openalex.org/W1797109199","https://openalex.org/W1923332106","https://openalex.org/W1923404803","https://openalex.org/W1947481528","https://openalex.org/W2016053056","https://openalex.org/W2018068650","https://openalex.org/W2034014085","https://openalex.org/W2064675550","https://openalex.org/W2101194540","https://openalex.org/W2102605133","https://openalex.org/W2105101328","https://openalex.org/W2126579184","https://openalex.org/W2157331557","https://openalex.org/W2175354415","https://openalex.org/W2290998037","https://openalex.org/W2326543519","https://openalex.org/W2342662179","https://openalex.org/W2345308841","https://openalex.org/W2460134573","https://openalex.org/W2472293097","https://openalex.org/W2519080876","https://openalex.org/W2605704591","https://openalex.org/W2610147486","https://openalex.org/W2611596598","https://openalex.org/W2613718673","https://openalex.org/W2751445731","https://openalex.org/W2779250840","https://openalex.org/W2792312609","https://openalex.org/W2913950831","https://openalex.org/W2943070176","https://openalex.org/W2962722947","https://openalex.org/W2962803561","https://openalex.org/W2963149042","https://openalex.org/W2963528106","https://openalex.org/W6600983433","https://openalex.org/W6617526114","https://openalex.org/W6620707391","https://openalex.org/W6622239757","https://openalex.org/W6637373629","https://openalex.org/W6640257725","https://openalex.org/W6685670348","https://openalex.org/W6725589990","https://openalex.org/W6734051801","https://openalex.org/W6736402229"],"related_works":["https://openalex.org/W4321784794","https://openalex.org/W2900482274","https://openalex.org/W2140435402","https://openalex.org/W4235055075","https://openalex.org/W4285276086","https://openalex.org/W2161633202","https://openalex.org/W2039787362","https://openalex.org/W1750537857","https://openalex.org/W2163490908","https://openalex.org/W2901621883"],"abstract_inverted_index":{"Spatial-temporal":[0],"action":[1,21,40,50,77,86,100,159,187,194],"detection":[2,22,26,32,41,67,78,87,160,195],"in":[3,14,60,68,79,96,145,196],"videos":[4,97],"is":[5,74,121],"a":[6,124,132],"challenging":[7],"problem":[8],"that":[9,89,120,181,223],"has":[10],"attracted":[11],"considerable":[12],"attention":[13],"recent":[15],"years.":[16],"Most":[17],"current":[18,163],"approaches":[19],"address":[20],"as":[23,35,135],"an":[24,61,84,117,176,197],"object":[25,31,66],"problem,":[27],"which":[28],"utilizes":[29],"successful":[30],"frameworks":[33],"such":[34],"Faster":[36],"R-CNN":[37],"to":[38,98,108,185,234],"operate":[39],"at":[42,168],"every":[43],"single":[44],"frame":[45],"first,":[46],"and":[47,102,137,192,217],"then":[48],"generates":[49],"tubes":[51],"by":[52],"linking":[53],"bounding":[54],"boxes":[55],"across":[56],"the":[57,91,110,139,143,146,150,153,156,162,202,235],"whole":[58],"video":[59,133],"offline":[62],"fashion.":[63,199],"However,":[64],"unlike":[65],"static":[69],"images,":[70],"temporal":[71],"context":[72,93,112],"information":[73,94,141,157],"vital":[75],"for":[76,158],"videos.":[80],"Therefore,":[81],"we":[82,106,174,207,242],"propose":[83],"online":[85,198],"model":[88,119,130,184],"leverages":[90],"spatial-temporal":[92,111],"existing":[95],"perform":[99],"inference":[101],"localization.":[103],"More":[104],"specifically,":[105],"try":[107],"depict":[109],"pattern":[113],"of":[114,190,204],"actions":[115],"via":[116],"encoder-decoder":[118],"based":[122],"on":[123,210,246],"convolutional":[125],"recurrent":[126],"neural":[127],"network.":[128],"The":[129,219],"accepts":[131],"snippet":[134,144],"input":[136],"encodes":[138],"dynamic":[140],"inside":[142],"forward":[147],"pass.":[148],"During":[149],"backward":[151],"pass,":[152],"decoder":[154],"resolves":[155],"with":[161],"appearance":[164],"or":[165,229],"motion":[166],"cue":[167],"each":[169],"time":[170,191],"stamp.":[171],"In":[172],"addition,":[173],"devise":[175],"incremental":[177],"action-tube":[178],"construction":[179],"algorithm":[180],"enables":[182],"our":[183,205,224,244],"accomplish":[186],"prediction":[188],"ahead":[189],"performs":[193],"To":[200,238],"evaluate":[201],"performance":[203,231],"method,":[206],"conduct":[208],"experiments":[209],"three":[211],"popular":[212],"public":[213],"datasets":[214],"UCF-101,":[215],"UCF-Sports,":[216],"J-HMDB-21.":[218],"experimental":[220],"results":[221],"demonstrate":[222],"method":[225],"can":[226],"achieve":[227],"competitive":[228],"superior":[230],"when":[232],"compared":[233],"state-of-the-art":[236],"methods.":[237],"encourage":[239],"further":[240],"research,":[241],"release":[243],"project":[245],"\u201chttps://github.com.hjjpku.OATD.\u201d":[247]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
