{"id":"https://openalex.org/W3045491988","doi":"https://doi.org/10.1109/iwcmc48107.2020.9148294","title":"KSF-ST: Video Captioning Based on Key Semantic Frames Extraction and Spatio-Temporal Attention Mechanism","display_name":"KSF-ST: Video Captioning Based on Key Semantic Frames Extraction and Spatio-Temporal Attention Mechanism","publication_year":2020,"publication_date":"2020-06-01","ids":{"openalex":"https://openalex.org/W3045491988","doi":"https://doi.org/10.1109/iwcmc48107.2020.9148294","mag":"3045491988"},"language":"en","primary_location":{"id":"doi:10.1109/iwcmc48107.2020.9148294","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwcmc48107.2020.9148294","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Wireless Communications and Mobile Computing (IWCMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101712268","display_name":"Zhaowei Qu","orcid":"https://orcid.org/0000-0002-9982-2359"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaowei Qu","raw_affiliation_strings":["Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023438758","display_name":"Luhan Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Luhan Zhang","raw_affiliation_strings":["Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102020015","display_name":"Xiaoru Wang","orcid":"https://orcid.org/0000-0001-7171-2783"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoru Wang","raw_affiliation_strings":["Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012733727","display_name":"Bingyu Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingyu Cao","raw_affiliation_strings":["Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102949073","display_name":"Yueli Li","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueli Li","raw_affiliation_strings":["Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Network System and Network Culture, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100324319","display_name":"Fu Li","orcid":"https://orcid.org/0000-0003-0319-0308"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu Li","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Portland States University, Portland, OR, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Portland States University, Portland, OR, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101712268"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0977,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.38828393,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1388","last_page":"1393"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8968483209609985},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8508343696594238},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6076070070266724},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6071227788925171},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5456212162971497},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5383468866348267},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5210796594619751},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5184080600738525},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.512367844581604},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4317758083343506},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.41310277581214905},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3980647921562195},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3350645899772644},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.21023645997047424},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.17564162611961365}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8968483209609985},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8508343696594238},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6076070070266724},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6071227788925171},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5456212162971497},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5383468866348267},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5210796594619751},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5184080600738525},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.512367844581604},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4317758083343506},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.41310277581214905},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3980647921562195},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3350645899772644},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.21023645997047424},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.17564162611961365},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iwcmc48107.2020.9148294","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iwcmc48107.2020.9148294","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Wireless Communications and Mobile Computing (IWCMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6000000238418579,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W65273053","https://openalex.org/W1492731187","https://openalex.org/W1522734439","https://openalex.org/W1840179877","https://openalex.org/W1956340063","https://openalex.org/W2016053056","https://openalex.org/W2085425470","https://openalex.org/W2106818711","https://openalex.org/W2133564696","https://openalex.org/W2139501017","https://openalex.org/W2164290393","https://openalex.org/W2358543963","https://openalex.org/W2425121537","https://openalex.org/W2587809655","https://openalex.org/W2884585870","https://openalex.org/W2962681491","https://openalex.org/W2962990649","https://openalex.org/W2963971014","https://openalex.org/W2964152081","https://openalex.org/W4246959375","https://openalex.org/W6629393784","https://openalex.org/W6641064462","https://openalex.org/W6683167905","https://openalex.org/W6684090549","https://openalex.org/W6719456621","https://openalex.org/W6753412334","https://openalex.org/W7001715179"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W3009270862","https://openalex.org/W2329000834","https://openalex.org/W2165504147"],"abstract_inverted_index":{"Video":[0],"captioning":[1,13,114,212],"is":[2,139,152,178],"one":[3],"of":[4,33,40,48,58,65,67,146,172],"research":[5],"hotspots":[6],"in":[7,56,127,160],"computer":[8],"vision.":[9],"At":[10],"present,":[11],"video":[12,27,49,113,147,173,211],"algorithms":[14,21,68,72],"mainly":[15],"have":[16,198],"following":[17],"problems:":[18],"First,":[19],"traditional":[20,71],"use":[22],"equal-interval":[23,52],"sampling":[24,53],"to":[25,45,101,132,141,154,166,183],"extract":[26,133,167],"features,":[28],"which":[29],"causes":[30],"the":[31,46,63,82,86,112,156,161,202,215],"loss":[32],"key":[34,118,134,143],"frames":[35,120],"containing":[36],"a":[37],"large":[38],"amount":[39,64],"semantic":[41,93,119,135,144,170],"information,":[42],"thus":[43],"leading":[44],"inaccuracy":[47],"captioning.":[50],"Moreover,":[51],"method":[54,115],"results":[55,203],"lots":[57],"redundant":[59],"frames,":[60,136,148,174],"thereby":[61],"increasing":[62],"computation":[66],"extremely.":[69],"Second,":[70],"only":[73],"consider":[74],"temporal":[75,97,181],"information":[76,145,171],"when":[77],"extracting":[78,96],"features.":[79],"However,":[80],"for":[81],"image":[83],"and":[84,122,149,201],"video,":[85],"spatial":[87,168,175],"features":[88,98,182],"also":[89],"contain":[90],"rich":[91],"latent":[92,169],"information.":[94],"Only":[95],"will":[99],"lead":[100],"inaccurate":[102],"natural":[103,186],"language":[104,187],"descriptions.":[105,188],"To":[106],"address":[107],"these":[108],"problems,":[109],"we":[110],"propose":[111],"based":[116],"on":[117,192],"extraction":[121],"spatio-temporal":[123],"attention":[124,176],"mechanism":[125,177],"(KSF-ST)":[126],"this":[128],"paper.":[129],"In":[130,164],"order":[131,165],"knowledge":[137,150,162],"graph":[138],"adopted":[140],"obtain":[142,155],"reasoning":[151],"used":[153],"correlation":[157],"among":[158],"entities":[159],"graph.":[163],"combined":[179],"with":[180],"generate":[184],"accurate":[185],"We":[189],"evaluate":[190],"KSF-ST":[191],"two":[193],"benchmark":[194],"datasets.":[195],"Extensive":[196],"experiments":[197],"been":[199],"conducted":[200],"demonstrate":[204],"that":[205],"our":[206],"algorithm":[207],"could":[208],"achieve":[209],"better":[210],"performance":[213],"than":[214],"state-of-the-art":[216],"algorithms.":[217]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
