{"id":"https://openalex.org/W2970898753","doi":"https://doi.org/10.1109/tpami.2020.3038993","title":"Semantic Conditioned Dynamic Modulation for Temporal Sentence Grounding in Videos","display_name":"Semantic Conditioned Dynamic Modulation for Temporal Sentence Grounding in Videos","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W2970898753","doi":"https://doi.org/10.1109/tpami.2020.3038993","mag":"2970898753","pmid":"https://pubmed.ncbi.nlm.nih.gov/33206601"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2020.3038993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2020.3038993","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011133696","display_name":"Yitian Yuan","orcid":"https://orcid.org/0000-0001-8701-7689"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yitian Yuan","raw_affiliation_strings":["Tsinghua-Berkeley Shenzhen Institute, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua-Berkeley Shenzhen Institute, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017116858","display_name":"Lin Ma","orcid":"https://orcid.org/0000-0002-7331-6132"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Ma","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100461874","display_name":"Jingwen Wang","orcid":"https://orcid.org/0000-0002-1405-4697"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingwen Wang","raw_affiliation_strings":["Tencent AI Lab, Shenzhen, Guandong, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab, Shenzhen, Guandong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431792","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3865-8145"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Tencent AI Lab, Shenzhen, Guandong, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab, Shenzhen, Guandong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100339293","display_name":"Wenwu Zhu","orcid":"https://orcid.org/0000-0003-2236-9290"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenwu Zhu","raw_affiliation_strings":["Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5011133696"],"corresponding_institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":14.92,"has_fulltext":false,"cited_by_count":215,"citation_normalized_percentile":{"value":0.99304377,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"44","issue":"5","first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.8399821519851685},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8275573253631592},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5554422736167908},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.542214035987854},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5138545036315918},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5088055729866028},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46043696999549866},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4260016083717346},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3564189076423645},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07574737071990967},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.07514578104019165}],"concepts":[{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.8399821519851685},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8275573253631592},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5554422736167908},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.542214035987854},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5138545036315918},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5088055729866028},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46043696999549866},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4260016083717346},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3564189076423645},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07574737071990967},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.07514578104019165},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2020.3038993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2020.3038993","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:33206601","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33206601","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.41999998688697815}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W129606432","https://openalex.org/W262578090","https://openalex.org/W1522734439","https://openalex.org/W1536680647","https://openalex.org/W1906515132","https://openalex.org/W1927052826","https://openalex.org/W2060300932","https://openalex.org/W2111078031","https://openalex.org/W2250539671","https://openalex.org/W2337252826","https://openalex.org/W2461621749","https://openalex.org/W2529163075","https://openalex.org/W2604114396","https://openalex.org/W2727849499","https://openalex.org/W2766402183","https://openalex.org/W2798354744","https://openalex.org/W2808647806","https://openalex.org/W2887928923","https://openalex.org/W2888456631","https://openalex.org/W2890502146","https://openalex.org/W2894280539","https://openalex.org/W2903901502","https://openalex.org/W2904824998","https://openalex.org/W2920582597","https://openalex.org/W2949888942","https://openalex.org/W2962677524","https://openalex.org/W2962869524","https://openalex.org/W2963017553","https://openalex.org/W2963155035","https://openalex.org/W2963354481","https://openalex.org/W2963521717","https://openalex.org/W2963524571","https://openalex.org/W2963662190","https://openalex.org/W2963916161","https://openalex.org/W2964089981","https://openalex.org/W2964138017","https://openalex.org/W2964274041","https://openalex.org/W2964350391","https://openalex.org/W2968356596","https://openalex.org/W3025323587","https://openalex.org/W3100481960","https://openalex.org/W4249736682","https://openalex.org/W4251194840","https://openalex.org/W6637373629","https://openalex.org/W6716109767","https://openalex.org/W6729110096","https://openalex.org/W6736356174","https://openalex.org/W6755310813","https://openalex.org/W6761268011","https://openalex.org/W6767312599","https://openalex.org/W6864424756"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2028665553","https://openalex.org/W4230315250","https://openalex.org/W2086519370","https://openalex.org/W2087343574"],"abstract_inverted_index":{"Temporal":[0],"sentence":[1,29,50,91,197],"grounding":[2,156,172],"in":[3,34],"videos":[4],"aims":[5],"to":[6,15,52,77,84,141,153],"localize":[7],"one":[8],"target":[9],"video":[10,32,65,80,105,193],"segment,":[11],"which":[12,47,137],"semantically":[13],"corresponds":[14],"a":[16,39,86,100],"given":[17],"sentence.":[18],"Unlike":[19],"previous":[20],"methods":[21],"mainly":[22],"focusing":[23],"on":[24,129,160,185],"matching":[25],"semantics":[26,51],"between":[27,90],"the":[28,49,54,63,78,96,125,130,134,143,147,165,170,181,187],"and":[30,61,92,113,150,175,190],"different":[31],"segments,":[33],"this":[35,202],"paper,":[36],"we":[37],"propose":[38],"novel":[40],"semantic":[41,88],"conditioned":[42],"dynamic":[43],"modulation":[44],"(SCDM)":[45],"mechanism,":[46],"leverages":[48],"modulate":[53],"temporal":[55,102,109,127,144,171,196],"convolution":[56,128],"operations":[57],"for":[58,195,201],"better":[59],"correlating":[60],"composing":[62],"sentence-relevant":[64],"contents":[66,81,194],"over":[67],"time.":[68],"The":[69],"proposed":[70,97,166],"SCDM":[71,98,184],"also":[72,122,179],"performs":[73],"dynamically":[74],"with":[75,99,107,124],"respect":[76],"diverse":[79],"so":[82],"as":[83],"establish":[85],"precise":[87],"alignment":[89],"video.":[93],"By":[94],"coupling":[95],"hierarchical":[101],"convolutional":[103],"architecture,":[104,136],"segments":[106,149],"various":[108],"scales":[110],"are":[111,121,138],"composed":[112],"localized.":[114],"Besides,":[115],"more":[116,154],"fine-grained":[117],"clip-level":[118],"actionness":[119],"scores":[120],"predicted":[123],"SCDM-coupled":[126],"bottom":[131],"layer":[132],"of":[133,146,183],"overall":[135],"further":[139,176],"used":[140],"adjust":[142],"boundaries":[145],"localized":[148],"thereby":[151],"lead":[152],"accurate":[155],"results.":[157],"Experimental":[158],"results":[159],"benchmark":[161],"datasets":[162],"demonstrate":[163],"that":[164],"model":[167,188],"can":[168],"improve":[169],"accuracy":[173],"consistently,":[174],"investigation":[177],"experiments":[178],"illustrate":[180],"advantages":[182],"stabilizing":[186],"training":[189],"associating":[191],"relevant":[192],"grounding.":[198],"Our":[199],"code":[200],"paper":[203],"is":[204],"available":[205],"at":[206],"https://github.com/yytzsy/SCDM-TPAMI.":[207]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":21},{"year":2024,"cited_by_count":39},{"year":2023,"cited_by_count":34},{"year":2022,"cited_by_count":42},{"year":2021,"cited_by_count":48},{"year":2020,"cited_by_count":28}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
