{"id":"https://openalex.org/W4390904989","doi":"https://doi.org/10.1109/tiv.2024.3353172","title":"Anticipation Video Captioning of Aerial Refueling Based on Combined Attention Masking Mechanism","display_name":"Anticipation Video Captioning of Aerial Refueling Based on Combined Attention Masking Mechanism","publication_year":2024,"publication_date":"2024-01-16","ids":{"openalex":"https://openalex.org/W4390904989","doi":"https://doi.org/10.1109/tiv.2024.3353172"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2024.3353172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3353172","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066900102","display_name":"Shuai Wu","orcid":"https://orcid.org/0000-0001-7713-1808"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Wu","raw_affiliation_strings":["School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-7713-1808","affiliations":[{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070954480","display_name":"Wei Tong","orcid":"https://orcid.org/0000-0002-8558-1822"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Tong","raw_affiliation_strings":["College of Automation and College of Artificial Intelligence, Nanjing University of Posts and Telecommunications, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-8558-1822","affiliations":[{"raw_affiliation_string":"College of Automation and College of Artificial Intelligence, Nanjing University of Posts and Telecommunications, Nanjing, China","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037392372","display_name":"Ya Duan","orcid":"https://orcid.org/0009-0008-7274-390X"},"institutions":[{"id":"https://openalex.org/I4210095084","display_name":"Zhongji Test Equipment (China)","ror":"https://ror.org/00p24re17","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210095084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ya Duan","raw_affiliation_strings":["Flight Test Technology and Engineering Center, Chinese Flight Test Establishment, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0009-0008-7274-390X","affiliations":[{"raw_affiliation_string":"Flight Test Technology and Engineering Center, Chinese Flight Test Establishment, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I4210095084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101865874","display_name":"Weidong Yang","orcid":"https://orcid.org/0000-0002-6473-9272"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weidong Yang","raw_affiliation_strings":["School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-6473-9272","affiliations":[{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Guangyu Zhu","orcid":"https://orcid.org/0009-0008-1467-1776"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangyu Zhu","raw_affiliation_strings":["Beijing Research Center of Urban Traffic Information Sensing and Service Technologies, Beijing Jiaotong University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-1467-1776","affiliations":[{"raw_affiliation_string":"Beijing Research Center of Urban Traffic Information Sensing and Service Technologies, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110956301","display_name":"Edmond Q. Wu","orcid":"https://orcid.org/0000-0003-1301-9870"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Edmond Q. Wu","raw_affiliation_strings":["Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-1301-9870","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4375,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57374793,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"9","issue":"3","first_page":"4373","last_page":"4382"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10930","display_name":"Flood Risk Assessment and Management","score":0.9728999733924866,"subfield":{"id":"https://openalex.org/subfields/2306","display_name":"Global and Planetary Change"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9341182708740234},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.777076780796051},{"id":"https://openalex.org/keywords/anticipation","display_name":"Anticipation (artificial intelligence)","score":0.654131293296814},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4529721140861511},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4314740002155304},{"id":"https://openalex.org/keywords/isolation","display_name":"Isolation (microbiology)","score":0.42984604835510254},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42949971556663513},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.39410191774368286},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.39315134286880493},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36483922600746155},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.33524182438850403},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11733335256576538}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9341182708740234},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.777076780796051},{"id":"https://openalex.org/C176777502","wikidata":"https://www.wikidata.org/wiki/Q4774623","display_name":"Anticipation (artificial intelligence)","level":2,"score":0.654131293296814},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4529721140861511},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4314740002155304},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.42984604835510254},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42949971556663513},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.39410191774368286},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.39315134286880493},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36483922600746155},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33524182438850403},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11733335256576538},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C89423630","wikidata":"https://www.wikidata.org/wiki/Q7193","display_name":"Microbiology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tiv.2024.3353172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3353172","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.49000000953674316}],"awards":[{"id":"https://openalex.org/G241012663","display_name":null,"funder_award_id":"62171274","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8335343387","display_name":null,"funder_award_id":"U2241228","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8880411100","display_name":null,"funder_award_id":"62272036","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W877909479","https://openalex.org/W1522734439","https://openalex.org/W1956340063","https://openalex.org/W2101105183","https://openalex.org/W2108325777","https://openalex.org/W2425121537","https://openalex.org/W2506483933","https://openalex.org/W2601686579","https://openalex.org/W2625940279","https://openalex.org/W2738136547","https://openalex.org/W2960747818","https://openalex.org/W2963302737","https://openalex.org/W2963482775","https://openalex.org/W2963916161","https://openalex.org/W2968863477","https://openalex.org/W2984862483","https://openalex.org/W3000432059","https://openalex.org/W3006320872","https://openalex.org/W3034426027","https://openalex.org/W3035392611","https://openalex.org/W3106534186","https://openalex.org/W3118497696","https://openalex.org/W3119777426","https://openalex.org/W3156501016","https://openalex.org/W3171688991","https://openalex.org/W3185716769","https://openalex.org/W4220790454","https://openalex.org/W4312550876","https://openalex.org/W4312560592","https://openalex.org/W4313598771","https://openalex.org/W4322730935","https://openalex.org/W4361029998","https://openalex.org/W4361030040","https://openalex.org/W4367280774","https://openalex.org/W4376166839","https://openalex.org/W4386066385","https://openalex.org/W4390572330","https://openalex.org/W6678262379","https://openalex.org/W6684090549","https://openalex.org/W6771217966","https://openalex.org/W6772619176","https://openalex.org/W6773737242","https://openalex.org/W6791353385"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W4310447809","https://openalex.org/W4200243030","https://openalex.org/W2800782462","https://openalex.org/W3209117276","https://openalex.org/W4388184981","https://openalex.org/W4323777661"],"abstract_inverted_index":{"Incorporating":[0],"visual":[1,54],"cues":[2,55],"to":[3,61,105,123,168,223],"anticipate":[4],"and":[5,84,131,142,154,183,238],"describe":[6],"future":[7,228],"events":[8,38],"holds":[9],"significant":[10,206],"promise":[11],"for":[12,48],"enhancing":[13],"user-friendly":[14,198],"early":[15,235],"warning":[16,236],"systems":[17,237],"in":[18,26,158,196,209],"emergency":[19,159,240],"response":[20,60,241],"scenarios.":[21],"However,":[22],"a":[23,66,94,102,118,138,164,178,205],"notable":[24],"limitation":[25],"existing":[27],"video":[28,95,103,112,129,144,172,210],"captioning":[29],"techniques":[30],"is":[31,78,117,137],"their":[32],"predominant":[33],"focus":[34],"on":[35,52],"describing":[36,217],"ongoing":[37],"within":[39],"observed":[40,53,111,141],"videos.":[41],"The":[42,89,114,134],"challenging":[43],"task":[44],"of":[45,101,150,181,187,193,221,227],"predicting":[46],"captions":[47],"unobserved":[49],"videos":[50],"based":[51],"remains":[56],"largely":[57],"unaddressed.":[58],"In":[59,146],"this":[62],"gap,":[63],"we":[64,161],"introduce":[65],"novel":[67],"neural":[68],"network":[69],"architecture":[70,83],"termed":[71],"the":[72,81,99,110,125,148,191,218,225],"Anticipation":[73],"Video":[74],"Captioning":[75],"Transformer,":[76],"which":[77,188],"built":[79],"upon":[80],"transformer":[82,104],"comprises":[85],"three":[86],"essential":[87],"modules.":[88],"first":[90],"module":[91,116,136],"serves":[92],"as":[93],"feature":[96],"extractor,":[97],"harnessing":[98],"capabilities":[100,214],"extract":[106],"spatiotemporal":[107],"features":[108],"from":[109],"data.":[113],"second":[115],"multimodal":[119],"mask":[120],"language":[121],"model":[122],"learn":[124],"intricate":[126],"correlations":[127],"between":[128],"content":[130],"corresponding":[132],"captions.":[133,145,200],"third":[135],"decoder,":[139],"generating":[140],"anticipation":[143,171,199,226],"assessing":[147],"efficacy":[149],"our":[151,194,202],"proposed":[152],"method":[153],"its":[155,213],"potential":[156],"applicability":[157],"scenarios,":[160],"have":[162],"developed":[163],"specialized":[165],"dataset":[166],"dedicated":[167],"aerial":[169],"refueling":[170],"captioning.":[173],"Our":[174],"experimental":[175],"evaluations":[176],"encompass":[177,224],"diverse":[179],"range":[180],"qualitative":[182],"quantitative":[184],"analyses,":[185],"all":[186],"consistently":[189],"demonstrate":[190],"effectiveness":[192],"approach":[195],"furnishing":[197],"Overall,":[201],"work":[203],"represents":[204],"step":[207],"forward":[208],"captioning,":[211],"extending":[212],"beyond":[215],"merely":[216],"present":[219],"state":[220],"affairs":[222],"events.":[229],"This":[230],"innovation":[231],"can":[232],"potentially":[233],"enhance":[234],"improve":[239],"procedures.":[242]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
