{"id":"https://openalex.org/W4320007076","doi":"https://doi.org/10.48550/arxiv.2204.10485","title":"Attentions Help CNNs See Better: Attention-based Hybrid Image Quality Assessment Network","display_name":"Attentions Help CNNs See Better: Attention-based Hybrid Image Quality Assessment Network","publication_year":2022,"publication_date":"2022-04-22","ids":{"openalex":"https://openalex.org/W4320007076","doi":"https://doi.org/10.48550/arxiv.2204.10485"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2204.10485","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.10485","pdf_url":"https://arxiv.org/pdf/2204.10485","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2204.10485","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086678836","display_name":"Shanshan Lao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lao, Shanshan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101858855","display_name":"Yuan Gong","orcid":"https://orcid.org/0009-0009-9097-4805"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gong, Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086329538","display_name":"Shuwei Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Shuwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113174783","display_name":"Sidi Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Sidi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063972231","display_name":"Tianhe Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tianhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329218","display_name":"Jiahao Wang","orcid":"https://orcid.org/0009-0005-9125-2629"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jiahao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028709578","display_name":"Weihao Xia","orcid":"https://orcid.org/0000-0003-0087-3525"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Weihao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020953714","display_name":"Yujiu Yang","orcid":"https://orcid.org/0000-0002-6427-1024"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yujiu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7753771543502808},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7042340040206909},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6787800192832947},{"id":"https://openalex.org/keywords/image-quality","display_name":"Image quality","score":0.5485339164733887},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5101421475410461},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4405609369277954},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.43716707825660706},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.4179893732070923},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4030023217201233},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36403077840805054},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33192458748817444}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7753771543502808},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7042340040206909},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6787800192832947},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.5485339164733887},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5101421475410461},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4405609369277954},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.43716707825660706},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.4179893732070923},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4030023217201233},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36403077840805054},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33192458748817444},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2204.10485","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.10485","pdf_url":"https://arxiv.org/pdf/2204.10485","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2204.10485","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2204.10485","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2204.10485","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.10485","pdf_url":"https://arxiv.org/pdf/2204.10485","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3931585407","display_name":null,"funder_award_id":"U1903213","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4320007076.pdf","grobid_xml":"https://content.openalex.org/works/W4320007076.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4293226380","https://openalex.org/W2397288865","https://openalex.org/W4321487865","https://openalex.org/W4313906399","https://openalex.org/W2368524271","https://openalex.org/W4247116873","https://openalex.org/W4391266461","https://openalex.org/W2095030957","https://openalex.org/W2066827917","https://openalex.org/W2884201223"],"abstract_inverted_index":{"Image":[0,79,210],"quality":[1],"assessment":[2],"(IQA)":[3],"algorithm":[4],"aims":[5],"to":[6,60,84,175],"quantify":[7],"the":[8,22,45,87,94,140,148,158,164,177,187,200,206],"human":[9],"perception":[10],"of":[11,47,160,205],"image":[12,56,71,127],"quality.":[13],"Unfortunately,":[14],"there":[15],"is":[16,155],"a":[17,101,105,111,152,170],"performance":[18,92],"drop":[19],"when":[20],"assessing":[21],"distortion":[23],"images":[24],"generated":[25],"by":[26,130],"generative":[27],"adversarial":[28],"network":[29,114],"(GAN)":[30],"with":[31,86,157],"seemingly":[32],"realistic":[33],"texture.":[34],"In":[35],"this":[36,41],"work,":[37],"we":[38,74,99,168],"conjecture":[39],"that":[40,183],"maladaptation":[42],"lies":[43],"in":[44],"backbone":[46],"IQA":[48,96,193],"models,":[49],"where":[50],"patch-level":[51],"prediction":[52,173],"methods":[53,189],"use":[54,169],"independent":[55],"patches":[57,128],"as":[58],"input":[59],"calculate":[61],"their":[62],"scores":[63],"separately,":[64],"but":[65],"lack":[66],"spatial":[67],"relationship":[68],"modeling":[69],"among":[70,126],"patches.":[72],"Therefore,":[73],"propose":[75],"an":[76],"Attention-based":[77],"Hybrid":[78],"Quality":[80,211],"Assessment":[81,212],"Network":[82],"(AHIQ)":[83],"deal":[85],"challenge":[88],"and":[89,110,132,195],"get":[90],"better":[91],"on":[93,147,190,199],"GAN-based":[95],"task.":[97],"Firstly,":[98],"adopt":[100],"two-branch":[102],"architecture,":[103],"including":[104],"vision":[106],"transformer":[107],"(ViT)":[108],"branch":[109,116],"convolutional":[112],"neural":[113],"(CNN)":[115],"for":[117],"feature":[118],"extraction.":[119],"The":[120,180],"hybrid":[121],"architecture":[122],"combines":[123],"interaction":[124],"information":[125,162],"captured":[129],"ViT":[131,165],"local":[133],"texture":[134],"details":[135],"from":[136,142,163],"CNN.":[137],"To":[138],"make":[139],"features":[141],"shallow":[143],"CNN":[144],"more":[145],"focused":[146],"visually":[149],"salient":[150],"region,":[151],"deformable":[153],"convolution":[154],"applied":[156],"help":[159],"semantic":[161],"branch.":[166],"Finally,":[167],"patch-wise":[171],"score":[172],"module":[174],"obtain":[176],"final":[178],"score.":[179],"experiments":[181],"show":[182],"our":[184],"model":[185],"outperforms":[186],"state-of-the-art":[188],"four":[191],"standard":[192],"datasets":[194],"AHIQ":[196],"ranked":[197],"first":[198],"Full":[201],"Reference":[202],"(FR)":[203],"track":[204],"NTIRE":[207],"2022":[208],"Perceptual":[209],"Challenge.":[213]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
