{"id":"https://openalex.org/W1996185082","doi":"https://doi.org/10.1109/vcip.2012.6410779","title":"Spatio-temporal ssim index for video quality assessment","display_name":"Spatio-temporal ssim index for video quality assessment","publication_year":2012,"publication_date":"2012-11-01","ids":{"openalex":"https://openalex.org/W1996185082","doi":"https://doi.org/10.1109/vcip.2012.6410779","mag":"1996185082"},"language":"en","primary_location":{"id":"doi:10.1109/vcip.2012.6410779","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2012.6410779","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2012 Visual Communications and Image Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100372142","display_name":"Yue Wang","orcid":"https://orcid.org/0009-0006-4065-6735"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yue Wang","raw_affiliation_strings":["Graduate University of Chinese Academy of Sciences, Beijing, China","Graduate University of Chinese Academy of Sciences,  Beijing China"],"affiliations":[{"raw_affiliation_string":"Graduate University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Graduate University of Chinese Academy of Sciences,  Beijing China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101606698","display_name":"Tingting Jiang","orcid":"https://orcid.org/0000-0002-5372-0656"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingting Jiang","raw_affiliation_strings":["National Engineering Lab for Video Technology, Peking University, Beijing, China","National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National Engineering Lab for Video Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039832462","display_name":"Siwei Ma","orcid":"https://orcid.org/0000-0002-2731-5403"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siwei Ma","raw_affiliation_strings":["National Engineering Lab for Video Technology, Peking University, Beijing, China","National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National Engineering Lab for Video Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101523804","display_name":"Wen Gao","orcid":"https://orcid.org/0000-0001-8894-1806"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Gao","raw_affiliation_strings":["National Engineering Lab for Video Technology, Peking University, Beijing, China","National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National Engineering Lab for Video Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"National Engineering Lab for Video Technology, Key Lab of Machine Perception(MoE), School of EECS, Peking University, Beijing, China#TAB#","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100372142"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.8236,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.73738827,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.7754626870155334},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7509927749633789},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.7301682829856873},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6430990695953369},{"id":"https://openalex.org/keywords/video-quality","display_name":"Video quality","score":0.6307726502418518},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5895993709564209},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.5140141248703003},{"id":"https://openalex.org/keywords/human-visual-system-model","display_name":"Human visual system model","score":0.45379507541656494},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4465647339820862},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4453662931919098},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4243740141391754},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3647570013999939},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.24234026670455933},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1607346534729004}],"concepts":[{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.7754626870155334},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7509927749633789},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.7301682829856873},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6430990695953369},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.6307726502418518},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5895993709564209},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.5140141248703003},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.45379507541656494},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4465647339820862},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4453662931919098},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4243740141391754},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3647570013999939},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.24234026670455933},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1607346534729004},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip.2012.6410779","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2012.6410779","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2012 Visual Communications and Image Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1766596758","https://openalex.org/W1990977013","https://openalex.org/W2005664438","https://openalex.org/W2031912957","https://openalex.org/W2035379092","https://openalex.org/W2084999174","https://openalex.org/W2101144220","https://openalex.org/W2113032778","https://openalex.org/W2117535912","https://openalex.org/W2118877769","https://openalex.org/W2121809595","https://openalex.org/W2125654704","https://openalex.org/W2133665775","https://openalex.org/W2140332897","https://openalex.org/W2142825011","https://openalex.org/W2144764737","https://openalex.org/W2153777140","https://openalex.org/W2165222134","https://openalex.org/W6638151783","https://openalex.org/W6677548441"],"related_works":["https://openalex.org/W2337415362","https://openalex.org/W4312857205","https://openalex.org/W121273120","https://openalex.org/W2740820121","https://openalex.org/W317572212","https://openalex.org/W2002009170","https://openalex.org/W2034462085","https://openalex.org/W2038316300","https://openalex.org/W1996185082","https://openalex.org/W2545649598"],"abstract_inverted_index":{"An":[0],"ideal":[1],"objective":[2],"metric":[3],"for":[4],"video":[5,13,29,61,135],"quality":[6,62],"assessment":[7],"(VQA)":[8],"should":[9,40],"achieve":[10],"consistency":[11],"between":[12],"distortion":[14,36,39],"prediction":[15],"and":[16,24,37,80,93,97,117,127],"psychological":[17],"perception":[18],"of":[19,47,134],"human":[20],"visual":[21],"system":[22],"(HVS),":[23],"is":[25,121,128],"important":[26],"in":[27,44,70,76,90],"many":[28],"processing":[30],"applications.":[31],"In":[32,50],"general,":[33],"both":[34,77],"spatial":[35,78],"temporal":[38,81],"be":[41],"carefully":[42],"considered":[43],"the":[45,66],"designing":[46],"VQA":[48,125],"metrics.":[49],"this":[51],"paper,":[52],"we":[53,83],"propose":[54,84],"a":[55,114],"novel":[56],"spatio-temporal":[57,104],"structural":[58,87],"information":[59],"based":[60,101],"metric.":[63],"Motivated":[64],"by":[65],"fact":[67],"that":[68,112],"pixels":[69],"natural":[71],"videos":[72],"are":[73],"highly":[74],"structured":[75],"domain":[79],"domain,":[82],"to":[85,131],"perform":[86],"similarity":[88],"evaluation":[89],"x-y,":[91],"x-t":[92],"y-t":[94],"dimensions":[95],"respectively":[96],"pooled":[98],"them":[99],"adaptively":[100],"on":[102,108],"local":[103],"activities.":[105],"Experimental":[106],"results":[107],"LIVE":[109],"database":[110],"show":[111],"such":[113],"conceptually":[115],"simple":[116],"computationally":[118],"efficient":[119],"algorithm":[120],"competitive":[122],"with":[123],"state-of-the-art":[124],"metrics,":[126],"very":[129],"robust":[130],"various":[132],"types":[133],"distortions.":[136]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
