{"id":"https://openalex.org/W2981411942","doi":"https://doi.org/10.1145/3343031.3351060","title":"Watch It Twice","display_name":"Watch It Twice","publication_year":2019,"publication_date":"2019-10-15","ids":{"openalex":"https://openalex.org/W2981411942","doi":"https://doi.org/10.1145/3343031.3351060","mag":"2981411942"},"language":"en","primary_location":{"id":"doi:10.1145/3343031.3351060","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351060","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053572530","display_name":"Xiangxi Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Xiangxi Shi","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100635804","display_name":"Jianfei Cai","orcid":"https://orcid.org/0000-0002-9444-3763"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jianfei Cai","raw_affiliation_strings":["Nanyang Technological University &amp; Monash University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University &amp; Monash University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005443526","display_name":"Shafiq Joty","orcid":"https://orcid.org/0000-0002-9222-2641"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shafiq Joty","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005119482","display_name":"Jiuxiang Gu","orcid":"https://orcid.org/0000-0002-3437-5084"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jiuxiang Gu","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053572530"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":1.9232,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.8933312,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"818","last_page":"826"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8726968765258789},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8567465543746948},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.7144638299942017},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6193572878837585},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5382769703865051},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5248218178749084},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4877348840236664},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4867849051952362},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4402093291282654},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.43947482109069824},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4267148971557617},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.42598438262939453},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41471827030181885},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07925128936767578}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8726968765258789},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8567465543746948},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.7144638299942017},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6193572878837585},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5382769703865051},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5248218178749084},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4877348840236664},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4867849051952362},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4402093291282654},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.43947482109069824},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4267148971557617},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.42598438262939453},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41471827030181885},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07925128936767578},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3343031.3351060","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351060","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7599999904632568,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W1586939924","https://openalex.org/W1956340063","https://openalex.org/W2064675550","https://openalex.org/W2133459682","https://openalex.org/W2139501017","https://openalex.org/W2142900973","https://openalex.org/W2157331557","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2425121537","https://openalex.org/W2526050071","https://openalex.org/W2554906389","https://openalex.org/W2557264465","https://openalex.org/W2560346187","https://openalex.org/W2575842049","https://openalex.org/W2607119937","https://openalex.org/W2745461083","https://openalex.org/W2798725893","https://openalex.org/W2807834696","https://openalex.org/W2890531016","https://openalex.org/W2895715183","https://openalex.org/W2895845501","https://openalex.org/W2899879331","https://openalex.org/W2950096400","https://openalex.org/W2962681491","https://openalex.org/W2962937869","https://openalex.org/W2962994439","https://openalex.org/W2963048642","https://openalex.org/W2963084599","https://openalex.org/W2963177403","https://openalex.org/W2963552819","https://openalex.org/W2963971014","https://openalex.org/W2964137974","https://openalex.org/W2992478697","https://openalex.org/W3098682680"],"related_works":["https://openalex.org/W2547835662","https://openalex.org/W4320858200","https://openalex.org/W2364498972","https://openalex.org/W1967750896","https://openalex.org/W2340102850","https://openalex.org/W1504288058","https://openalex.org/W4365441642","https://openalex.org/W2249304068","https://openalex.org/W4308238081","https://openalex.org/W2990667865"],"abstract_inverted_index":{"With":[0],"the":[1,8,52,67,72,86,90,94,131,140,156,160,180,195],"rapid":[2],"growth":[3],"of":[4,11,32,96,162,175,194],"video":[5,18,25,45,75,121,132,141,177],"data":[6],"and":[7,20,38,64,92,124,158,178],"increasing":[9],"demands":[10],"various":[12],"crossmodal":[13],"applications":[14],"such":[15],"as":[16],"intelligent":[17],"search":[19],"assistance":[21],"towards":[22],"visually-impaired":[23],"people,":[24],"captioning":[26,46,133],"task":[27],"has":[28],"received":[29],"a":[30,97,118,125,144,163,176],"lot":[31],"attention":[33],"recently":[34],"in":[35,111],"computer":[36],"vision":[37],"natural":[39],"language":[40],"processing":[41],"fields.":[42],"The":[43,135,165],"state-of-the-art":[44],"methods":[47],"focus":[48],"more":[49,183],"on":[50,187],"encoding":[51,122,137],"temporal":[53,62,83,151],"information,":[54,84],"while":[55],"lacking":[56],"effective":[57],"ways":[58],"to":[59,107,148],"remove":[60],"irrelevant":[61,82,87,150],"information":[63,88,152,171],"also":[65],"neglecting":[66],"spatial":[68,103,128,167,170],"details.":[69],"In":[70,99,113],"particular,":[71],"current":[73],"unidirectional":[74],"encoder":[76],"can":[77],"be":[78],"negatively":[79],"affected":[80],"by":[81],"especially":[85],"at":[89,93,155,159],"beginning":[91,157],"end":[95,161],"video.":[98,164],"addition,":[100],"disregarding":[101],"detailed":[102,184],"features":[104,168],"may":[105],"lead":[106],"incorrect":[108],"word":[109],"choices":[110],"decoding.":[112],"this":[114],"paper,":[115],"we":[116],"propose":[117],"novel":[119,126,166],"recurrent":[120,136],"method":[123],"visual":[127],"feature":[129],"for":[130],"task.":[134],"module":[138],"encodes":[139],"twice":[142],"with":[143,182],"predicted":[145],"key":[146],"frame":[147],"avoid":[149],"often":[153],"occurring":[154],"represent":[169],"from":[172],"different":[173],"regions":[174],"provide":[179],"decoder":[181],"information.":[185],"Experiments":[186],"two":[188],"benchmark":[189],"datasets":[190],"show":[191],"superior":[192],"performance":[193],"proposed":[196],"method.":[197]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2019-11-01T00:00:00"}
