{"id":"https://openalex.org/W7155046687","doi":"https://doi.org/10.48550/arxiv.2604.17074","title":"Comparison Drives Preference: Reference-Aware Modeling for AI-Generated Video Quality Assessment","display_name":"Comparison Drives Preference: Reference-Aware Modeling for AI-Generated Video Quality Assessment","publication_year":2026,"publication_date":"2026-04-18","ids":{"openalex":"https://openalex.org/W7155046687","doi":"https://doi.org/10.48550/arxiv.2604.17074"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.17074","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17074","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.17074","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022701174","display_name":"Minghao Zou","orcid":"https://orcid.org/0000-0002-0239-3990"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Minghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100610688","display_name":"Gen Liu","orcid":"https://orcid.org/0000-0001-9789-540X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Gen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134204689","display_name":"Guanghui Yue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yue, Guanghui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134188191","display_name":"Baoquan Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Baoquan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100356886","display_name":"Zhihua Wang","orcid":"https://orcid.org/0000-0002-7521-2900"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhihua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134198791","display_name":"Paul L. Rosin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rosin, Paul L.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134104778","display_name":"Hantao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Hantao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134211696","display_name":"Wei Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.0034000000450760126,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.0007999999797903001,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/video-quality","display_name":"Video quality","score":0.6876000165939331},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6510999798774719},{"id":"https://openalex.org/keywords/quality-assessment","display_name":"Quality assessment","score":0.6247000098228455},{"id":"https://openalex.org/keywords/quality-score","display_name":"Quality Score","score":0.5992000102996826},{"id":"https://openalex.org/keywords/subjective-video-quality","display_name":"Subjective video quality","score":0.5968000292778015},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5781999826431274},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4959000051021576},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4156000018119812}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7839999794960022},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.6876000165939331},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6510999798774719},{"id":"https://openalex.org/C3020001037","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assessment","level":3,"score":0.6247000098228455},{"id":"https://openalex.org/C2779346075","wikidata":"https://www.wikidata.org/wiki/Q7268763","display_name":"Quality Score","level":3,"score":0.5992000102996826},{"id":"https://openalex.org/C114227958","wikidata":"https://www.wikidata.org/wiki/Q7631422","display_name":"Subjective video quality","level":4,"score":0.5968000292778015},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5781999826431274},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5216000080108643},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5041000247001648},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4959000051021576},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42649999260902405},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4156000018119812},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3898000121116638},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3208000063896179},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C2984588014","wikidata":"https://www.wikidata.org/wiki/Q730675","display_name":"Quantitative assessment","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.29350000619888306},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.26579999923706055},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.262800008058548},{"id":"https://openalex.org/C3018395757","wikidata":"https://www.wikidata.org/wiki/Q1379672","display_name":"Evaluation methods","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2623000144958496},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25769999623298645}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.17074","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17074","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.17074","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17074","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"advancement":[2],"of":[3,12,20,156],"generative":[4],"models":[5],"has":[6],"led":[7],"to":[8,109,123,165],"a":[9,61,105],"growing":[10],"volume":[11],"AI-generated":[13,26],"videos,":[14,84],"making":[15],"the":[16,120,124,154,157],"automatic":[17],"quality":[18,29,36,68,141],"assessment":[19,30,69],"such":[21],"videos":[22],"increasingly":[23],"important.":[24],"Existing":[25],"content":[27],"video":[28,40,76],"(AIGC-VQA)":[31],"methods":[32,138],"typically":[33],"estimate":[34],"visual":[35],"by":[37,74,80,148],"analyzing":[38],"each":[39],"independently,":[41],"ignoring":[42],"potential":[43,164],"relationships":[44],"among":[45],"videos.":[46],"In":[47],"this":[48,66],"work,":[49],"we":[50,96],"revisit":[51],"AIGC-VQA":[52],"from":[53,119],"an":[54],"inter-video":[55],"perspective":[56],"and":[57,114,161],"formulate":[58],"it":[59],"as":[60],"reference-aware":[62],"evaluation":[63],"problem.":[64],"Through":[65],"formulation,":[67],"is":[70,86],"guided":[71],"not":[72],"only":[73],"intrinsic":[75],"characteristics":[77],"but":[78],"also":[79],"comparisons":[81],"with":[82,89,143],"related":[83,112],"which":[85,103],"more":[87],"consistent":[88],"human":[90],"perception.":[91],"To":[92],"validate":[93],"its":[94,163],"effectiveness,":[95],"propose":[97],"Reference-aware":[98],"Video":[99],"Quality":[100],"Assessment":[101],"(RefVQA),":[102],"utilizes":[104],"query-centered":[106],"reference":[107,121],"graph":[108],"organize":[110],"semantically":[111],"samples":[113],"performs":[115],"graph-guided":[116],"difference":[117],"aggregation":[118],"nodes":[122],"query":[125],"node.":[126],"Experiments":[127],"on":[128],"existing":[129],"datasets":[130],"demonstrate":[131],"that":[132],"our":[133],"proposed":[134,158],"RefVQA":[135],"outperforms":[136],"state-of-the-art":[137],"across":[139],"multiple":[140],"dimensions,":[142],"strong":[144],"generalization":[145],"ability":[146],"validated":[147],"cross-dataset":[149],"evaluation.":[150],"These":[151],"results":[152],"highlight":[153],"effectiveness":[155],"reference-based":[159],"formulation":[160],"suggest":[162],"advance":[166],"AIGC-VQA.":[167]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-22T00:00:00"}
