{"id":"https://openalex.org/W4407693483","doi":"https://doi.org/10.1109/tmm.2025.3543087","title":"Viewport Prediction With Unsupervised Multiscale Causal Representation Learning for Virtual Reality Video Streaming","display_name":"Viewport Prediction With Unsupervised Multiscale Causal Representation Learning for Virtual Reality Video Streaming","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4407693483","doi":"https://doi.org/10.1109/tmm.2025.3543087"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3543087","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3543087","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100384090","display_name":"Yingjie Liu","orcid":"https://orcid.org/0000-0003-3835-6048"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yingjie Liu","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100411782","display_name":"Dan Wang","orcid":"https://orcid.org/0000-0001-9302-3233"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dan Wang","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035560190","display_name":"Bin Song","orcid":"https://orcid.org/0000-0002-8096-3370"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Song","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, Xidian University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I149594827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100384090"],"corresponding_institution_ids":["https://openalex.org/I149594827"],"apc_list":null,"apc_paid":null,"fwci":3.6542,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.91939956,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"27","issue":null,"first_page":"4752","last_page":"4764"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.911899983882904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9038000106811523,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/viewport","display_name":"Viewport","score":0.9123005270957947},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8702694177627563},{"id":"https://openalex.org/keywords/virtual-reality","display_name":"Virtual reality","score":0.6957241892814636},{"id":"https://openalex.org/keywords/video-streaming","display_name":"Video streaming","score":0.4847104549407959},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.47982048988342285},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4052257537841797},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3544950485229492},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.33355259895324707},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3245598077774048},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.12846127152442932}],"concepts":[{"id":"https://openalex.org/C2778090530","wikidata":"https://www.wikidata.org/wiki/Q2523931","display_name":"Viewport","level":2,"score":0.9123005270957947},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8702694177627563},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.6957241892814636},{"id":"https://openalex.org/C2986160907","wikidata":"https://www.wikidata.org/wiki/Q220499","display_name":"Video streaming","level":2,"score":0.4847104549407959},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.47982048988342285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4052257537841797},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3544950485229492},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33355259895324707},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3245598077774048},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.12846127152442932},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3543087","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3543087","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4406704326","display_name":null,"funder_award_id":"62201419","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8160288408","display_name":null,"funder_award_id":"62372357","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W2585813514","https://openalex.org/W2620871200","https://openalex.org/W2622637199","https://openalex.org/W2798428896","https://openalex.org/W2895957446","https://openalex.org/W2896449077","https://openalex.org/W2896840651","https://openalex.org/W2897460799","https://openalex.org/W2951881930","https://openalex.org/W2964942120","https://openalex.org/W2971025576","https://openalex.org/W2996939355","https://openalex.org/W3020127778","https://openalex.org/W3030482512","https://openalex.org/W3094338163","https://openalex.org/W3119121492","https://openalex.org/W3136920339","https://openalex.org/W3141438256","https://openalex.org/W3173329356","https://openalex.org/W3195342827","https://openalex.org/W3205285744","https://openalex.org/W4210795263","https://openalex.org/W4220991980","https://openalex.org/W4221086736","https://openalex.org/W4221098881","https://openalex.org/W4221129962","https://openalex.org/W4226225860","https://openalex.org/W4243538177","https://openalex.org/W4251137679","https://openalex.org/W4281653211","https://openalex.org/W4285606598","https://openalex.org/W4293057496","https://openalex.org/W4293794975","https://openalex.org/W4294643390","https://openalex.org/W4308233970","https://openalex.org/W4309157242","https://openalex.org/W4313412899","https://openalex.org/W4317796966","https://openalex.org/W4383316158","https://openalex.org/W4386074714","https://openalex.org/W4386159889","https://openalex.org/W4387148495","https://openalex.org/W4387741824","https://openalex.org/W4390481616"],"related_works":["https://openalex.org/W4389095575","https://openalex.org/W2908978341","https://openalex.org/W4294975495","https://openalex.org/W2992753629","https://openalex.org/W3161069372","https://openalex.org/W3171203216","https://openalex.org/W2953145693","https://openalex.org/W4400649593","https://openalex.org/W4403863317","https://openalex.org/W2765219117"],"abstract_inverted_index":{"The":[0,170,199,301],"rise":[1],"of":[2,10,25,112,123,258,265,274,282,307],"the":[3,7,28,82,121,129,180,215,228,231,235,239,242,250,255,263,266,271,275,280,291,294,305,308],"metaverse":[4],"has":[5],"driven":[6],"rapid":[8],"development":[9],"various":[11],"applications,":[12],"such":[13],"as":[14],"Virtual":[15],"Reality":[16,20],"(VR)":[17],"and":[18,38,76,91,125,139,164,219],"Augmented":[19],"(AR).":[21],"As":[22],"a":[23,50,175,297],"form":[24],"multimedia":[26],"in":[27,81,85,157,189,223,234,241,293],"metaverse,":[29],"VR":[30,34,60,79,158],"video":[31,36,44,61,80,113,126,159,165,191,224,259],"streaming":[32,37,78],"(a.k.a.,":[33],"spherical":[35],"360<inline-formula":[39,51],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[40,52],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[41,53],"notation=\"LaTeX\">$^{\\circ":[42,54],"}$</tex-math></inline-formula>":[43,55],"streaming)":[45],"can":[46,87],"provide":[47],"users":[48,124,283],"with":[49],"immersive":[56],"experience.":[57],"Generally,":[58],"transmitting":[59],"requires":[62],"far":[63],"more":[64],"bandwidth":[65,89],"than":[66],"regular":[67],"videos,":[68],"which":[69],"greatly":[70],"strains":[71],"existing":[72,95],"network":[73],"transmission.":[74],"Predicting":[75],"selectively":[77],"users'":[83,182,196,251,276],"viewports":[84,106,156,183,188],"advance":[86],"reduce":[88],"consumption":[90],"system":[92],"latency.":[93],"However,":[94],"methods":[96,103],"either":[97],"consider":[98],"only":[99],"historical":[100,187],"viewport-based":[101],"prediction":[102,141,168,273],"or":[104],"predict":[105,155,179],"by":[107,174,286],"correlations":[108,132],"between":[109,133,217],"visual":[110,134,221],"features":[111,135,222],"frames,":[114,225],"making":[115],"it":[116],"hard":[117],"to":[118,120,137,154,178,193,195,213,254,290],"adapt":[119,194],"dynamics":[122],"content.":[127,260],"In":[128,278],"meantime,":[130],"spurious":[131],"lead":[136],"inaccurate":[138],"unreliable":[140],"results.":[142],"Hence,":[143],"we":[144],"propose":[145],"an":[146,208],"unsupervised":[147,202],"multiscale":[148,203],"causal":[149,204,210,246],"representation":[150,205],"learning":[151,206],"(UMCRL)-based":[152],"method":[153],"streaming,":[160],"including":[161],"user":[162],"preference-based":[163],"content-based":[166],"viewport":[167,295],"models.":[169],"former":[171],"is":[172,284],"designed":[173],"position":[176],"predictor":[177],"future":[181],"based":[184],"on":[185],"their":[186],"multiple":[190],"frames":[192],"dynamic":[197,256],"preferences.":[198],"latter":[200],"achieves":[201],"through":[207,296],"asymmetric":[209],"regressor,":[211],"used":[212],"infer":[214],"causalities":[216,240],"local":[218],"global-local":[220],"thereby":[226],"helping":[227],"model":[229],"understand":[230],"contextual":[232],"information":[233],"videos.":[236],"We":[237],"embed":[238],"transformer":[243],"decoder":[244],"via":[245],"self-attention":[247],"for":[248],"predicting":[249],"viewports,":[252],"adapting":[253],"changes":[257],"Finally,":[261],"combining":[262],"results":[264,303],"two":[267],"aforementioned":[268],"models":[269],"yields":[270],"final":[272],"viewports.":[277],"addition,":[279],"QoE":[281],"satisfied":[285],"assigning":[287],"different":[288],"bitrates":[289],"tiles":[292],"pyramid-based":[298],"bitrate":[299],"allocation.":[300],"experimental":[302],"verify":[304],"effectiveness":[306],"method.":[309]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
