{"id":"https://openalex.org/W4415537505","doi":"https://doi.org/10.1145/3746027.3754839","title":"TimeChat-Online: 80% Visual Tokens are Naturally Redundant in Streaming Videos","display_name":"TimeChat-Online: 80% Visual Tokens are Naturally Redundant in Streaming Videos","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415537505","doi":"https://doi.org/10.1145/3746027.3754839"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3754839","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754839","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100599428","display_name":"Linli Yao","orcid":"https://orcid.org/0000-0002-9809-8864"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linli Yao","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9809-8864","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yicheng Li","orcid":"https://orcid.org/0009-0005-5599-1504"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yicheng Li","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-5599-1504","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037752195","display_name":"Yuancheng Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuancheng Wei","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0009-0007-1576-3341","affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lei Li","orcid":"https://orcid.org/0009-0008-6984-5104"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lei Li","raw_affiliation_strings":["University of Hong Kong, Hong Kong, China"],"raw_orcid":"https://orcid.org/0009-0008-6984-5104","affiliations":[{"raw_affiliation_string":"University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101030723","display_name":"Shuhuai Ren","orcid":"https://orcid.org/0009-0001-9998-864X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuhuai Ren","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-9998-864X","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yuanxin Liu","orcid":"https://orcid.org/0009-0000-7218-4011"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanxin Liu","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-7218-4011","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109515733","display_name":"Kun Ouyang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Ouyang","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-5788-9126","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034611488","display_name":"Lean Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lean Wang","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-7676-8065","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100723941","display_name":"Shicheng Li","orcid":"https://orcid.org/0000-0002-5724-0641"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shicheng Li","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5724-0641","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018158797","display_name":"LI Si-da","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sida Li","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-7994-8050","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014554970","display_name":"Lingpeng Kong","orcid":"https://orcid.org/0000-0002-9033-2724"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lingpeng Kong","raw_affiliation_strings":["University of Hong Kong, Hong Kong, China"],"raw_orcid":"https://orcid.org/0000-0002-9033-2724","affiliations":[{"raw_affiliation_string":"University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092188471","display_name":"Qi Liu","orcid":"https://orcid.org/0000-0003-4608-5778"},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Qi Liu","raw_affiliation_strings":["University of Hong Kong, Hong Kong, China"],"raw_orcid":"https://orcid.org/0000-0003-4608-5778","affiliations":[{"raw_affiliation_string":"University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020022791","display_name":"Yuanxing Zhang","orcid":"https://orcid.org/0000-0003-1460-8124"},"institutions":[{"id":"https://openalex.org/I4210108109","display_name":"Beijing Enterprises (China)","ror":"https://ror.org/01egb4878","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210108109"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanxing Zhang","raw_affiliation_strings":["Kling Team, Kuaishou, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1460-8124","affiliations":[{"raw_affiliation_string":"Kling Team, Kuaishou, Beijing, China","institution_ids":["https://openalex.org/I4210108109"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101441137","display_name":"Xu Sun","orcid":"https://orcid.org/0000-0001-8241-9320"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Sun","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8241-9320","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":14,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.2561,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.94922447,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"10807","last_page":"10816"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12720","display_name":"Multimedia Communication and Technology","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6639000177383423},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6571000218391418},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.5475999712944031},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.444599986076355},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.43160000443458557},{"id":"https://openalex.org/keywords/video-streaming","display_name":"Video streaming","score":0.33250001072883606},{"id":"https://openalex.org/keywords/video-compression-picture-types","display_name":"Video compression picture types","score":0.3287999927997589},{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.3253999948501587}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8600000143051147},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6639000177383423},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6571000218391418},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.5475999712944031},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.444599986076355},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.43160000443458557},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.35510000586509705},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33719998598098755},{"id":"https://openalex.org/C2986160907","wikidata":"https://www.wikidata.org/wiki/Q220499","display_name":"Video streaming","level":2,"score":0.33250001072883606},{"id":"https://openalex.org/C106030495","wikidata":"https://www.wikidata.org/wiki/Q1797012","display_name":"Video compression picture types","level":4,"score":0.3287999927997589},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32749998569488525},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.3253999948501587},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.3249000012874603},{"id":"https://openalex.org/C151211776","wikidata":"https://www.wikidata.org/wiki/Q2778015","display_name":"Video capture","level":3,"score":0.32269999384880066},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.3222000002861023},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C117090137","wikidata":"https://www.wikidata.org/wiki/Q7927977","display_name":"Video post-processing","level":5,"score":0.3100999891757965},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3010999858379364},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.30079999566078186},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C2988167200","wikidata":"https://www.wikidata.org/wiki/Q16885149","display_name":"Online video","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.2978000044822693},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C2777851325","wikidata":"https://www.wikidata.org/wiki/Q7094102","display_name":"Online model","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.2646999955177307},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.25429999828338623}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3754839","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754839","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G963605737","display_name":null,"funder_award_id":"92470205, 62176002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2165533158","https://openalex.org/W4213285154","https://openalex.org/W4389519587","https://openalex.org/W4402702917","https://openalex.org/W4402727885","https://openalex.org/W4402754220","https://openalex.org/W4403939369","https://openalex.org/W4405561007","https://openalex.org/W4413146710"],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"growth":[2],"of":[3,97,148,194,250],"online":[4,74],"video":[5,18,26,79,136,172,195,225,255],"platforms,":[6],"particularly":[7],"live":[8],"streaming":[9,57,101,152,171,214],"services,":[10],"has":[11],"created":[12],"an":[13,132],"urgent":[14],"need":[15],"for":[16,37],"real-time":[17,78,164],"understanding":[19],"systems.":[20],"These":[21],"systems":[22],"must":[23],"process":[24],"continuous":[25,192],"streams":[27],"and":[28,181,217,219,230],"respond":[29],"to":[30,60,63],"user":[31],"queries":[32],"instantaneously,":[33],"presenting":[34],"unique":[35,185],"challenges":[36],"current":[38],"Video":[39],"Large":[40],"Language":[41],"Models":[42],"(VideoLLMs).":[43],"While":[44],"existing":[45],"VideoLLMs":[46],"excel":[47],"at":[48],"processing":[49],"complete":[50],"videos,":[51],"they":[52],"face":[53],"significant":[54],"limitations":[55],"in":[56,100,135,151],"scenarios":[58],"due":[59],"their":[61],"inability":[62],"handle":[64],"dense,":[65],"redundant":[66,121,156],"frames":[67],"efficiently.":[68],"We":[69],"introduce":[70],"TimeChat-Online,":[71],"a":[72,169,239],"novel":[73],"VideoLLM":[75],"that":[76,129,145],"revolutionizes":[77],"interaction.":[80],"At":[81],"its":[82],"core":[83],"lies":[84],"our":[85,126],"innovative":[86],"Differential":[87],"Token":[88],"Drop":[89],"(DTD)":[90],"module,":[91],"which":[92],"addresses":[93],"the":[94,244],"fundamental":[95],"challenge":[96],"visual":[98,107,149],"redundancy":[99],"videos.":[102],"Drawing":[103],"inspiration":[104],"from":[105,203],"human":[106],"perception's":[108],"Change":[109],"Blindness":[110],"phenomenon,":[111],"DTD":[112,130,237],"preserves":[113],"meaningful":[114],"temporal":[115],"changes":[116],"while":[117,138,253],"filtering":[118],"out":[119],"static,":[120],"content":[122,150],"between":[123],"frames.":[124],"Remarkably,":[125],"experiments":[127],"demonstrate":[128],"achieves":[131,238],"82.8%":[133],"reduction":[134],"tokens":[137,256],"maintaining":[139,220],"98%":[140],"performance":[141,212],"on":[142,213,223,243],"StreamingBench,":[143],"revealing":[144],"over":[146],"80%":[147],"videos":[153,249],"is":[154],"naturally":[155,189],"without":[157],"requiring":[158],"language":[159],"guidance.":[160],"To":[161],"enable":[162],"seamless":[163],"interaction,":[165],"we":[166],"present":[167],"TimeChat-Online-139K,":[168],"comprehensive":[170],"dataset":[173],"featuring":[174],"diverse":[175],"interaction":[176],"patterns":[177],"including":[178],"backward-tracing,":[179],"current-perception,":[180],"future-responding":[182],"scenarios.":[183],"TimeChat-Online's":[184,210],"Proactive":[186],"Response":[187],"capability,":[188],"achieved":[190],"through":[191],"monitoring":[193],"scene":[196],"transitions":[197],"via":[198],"DTD,":[199],"sets":[200],"it":[201],"apart":[202],"conventional":[204],"approaches.":[205],"Our":[206],"extensive":[207],"evaluation":[208],"demonstrates":[209],"superior":[211],"benchmarks":[215],"(StreamingBench":[216],"OvOBench)":[218],"competitive":[221],"results":[222],"long-form":[224],"tasks":[226],"such":[227],"as":[228],"Video-MME":[229],"MLVU.":[231],"Notably,":[232],"when":[233],"integrated":[234],"with":[235],"Qwen2.5VL-7B,":[236],"5.7-point":[240],"accuracy":[241],"improvement":[242],"challenging":[245],"VideoMME":[246],"subset":[247],"containing":[248],"30-60":[251],"minutes,":[252],"reducing":[254],"by":[257],"84.6%.":[258],"Project":[259],"page:":[260],"https://timechat-online.github.io.":[261]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-25T00:00:00"}
