{"id":"https://openalex.org/W4414856469","doi":"https://doi.org/10.1109/tmm.2025.3618555","title":"CLIP-SR: Collaborative Linguistic and Image Processing for Super-Resolution","display_name":"CLIP-SR: Collaborative Linguistic and Image Processing for Super-Resolution","publication_year":2025,"publication_date":"2025-10-06","ids":{"openalex":"https://openalex.org/W4414856469","doi":"https://doi.org/10.1109/tmm.2025.3618555"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3618555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3618555","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026892941","display_name":"Bingwen Hu","orcid":"https://orcid.org/0000-0003-4890-1775"},"institutions":[{"id":"https://openalex.org/I92178344","display_name":"Anhui University of Technology","ror":"https://ror.org/02qdtrq21","country_code":"CN","type":"education","lineage":["https://openalex.org/I92178344"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bingwen Hu","raw_affiliation_strings":["School of Computer Science and Technology, Anhui University of Technology, Ma&#x2019;anshan, China","School of Computer Science and Technology, Anhui University of Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Anhui University of Technology, Ma&#x2019;anshan, China","institution_ids":["https://openalex.org/I92178344"]},{"raw_affiliation_string":"School of Computer Science and Technology, Anhui University of Technology, China","institution_ids":["https://openalex.org/I92178344"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Heng Liu","orcid":"https://orcid.org/0000-0001-7563-2676"},"institutions":[{"id":"https://openalex.org/I92178344","display_name":"Anhui University of Technology","ror":"https://ror.org/02qdtrq21","country_code":"CN","type":"education","lineage":["https://openalex.org/I92178344"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Liu","raw_affiliation_strings":["School of Computer Science and Technology, Anhui University of Technology, Ma&#x2019;anshan, China","School of Computer Science and Technology, Anhui University of Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Anhui University of Technology, Ma&#x2019;anshan, China","institution_ids":["https://openalex.org/I92178344"]},{"raw_affiliation_string":"School of Computer Science and Technology, Anhui University of Technology, China","institution_ids":["https://openalex.org/I92178344"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034162160","display_name":"Zhedong Zheng","orcid":"https://orcid.org/0000-0002-2434-9050"},"institutions":[{"id":"https://openalex.org/I204512498","display_name":"University of Macau","ror":"https://ror.org/01r4q9n85","country_code":"MO","type":"education","lineage":["https://openalex.org/I204512498"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Zhedong Zheng","raw_affiliation_strings":["Faculty of Science and Technology, and Institute of Collaborative Innovation, University of Macau, Macau, China","FST and ICI, University of Macau, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Science and Technology, and Institute of Collaborative Innovation, University of Macau, Macau, China","institution_ids":["https://openalex.org/I204512498"]},{"raw_affiliation_string":"FST and ICI, University of Macau, China","institution_ids":["https://openalex.org/I204512498"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100442358","display_name":"Ping Liu","orcid":"https://orcid.org/0000-0002-3170-3783"},"institutions":[{"id":"https://openalex.org/I134113660","display_name":"University of Nevada, Reno","ror":"https://ror.org/01keh0577","country_code":"US","type":"education","lineage":["https://openalex.org/I134113660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ping Liu","raw_affiliation_strings":["Department of Computer Science and Engineering, University of Nevada, Reno, NV, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of Nevada, Reno, NV, USA","institution_ids":["https://openalex.org/I134113660"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5026892941"],"corresponding_institution_ids":["https://openalex.org/I92178344"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26508973,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"17","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.9746999740600586,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9509999752044678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6177999973297119},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.616100013256073},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.5796999931335449},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5633999705314636},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4047999978065491},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4027000069618225},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.38989999890327454},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.3785000145435333},{"id":"https://openalex.org/keywords/semantic-memory","display_name":"Semantic memory","score":0.3424000144004822}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8723000288009644},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6177999973297119},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.616100013256073},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5830000042915344},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.5796999931335449},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5633999705314636},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5184000134468079},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4027000069618225},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.38989999890327454},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.3785000145435333},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.3424000144004822},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3379000127315521},{"id":"https://openalex.org/C202708506","wikidata":"https://www.wikidata.org/wiki/Q7449050","display_name":"Semantic compression","level":5,"score":0.3253999948501587},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3221000134944916},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.2953000068664551},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.2856000065803528},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25949999690055847},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2565999925136566}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3618555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3618555","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4224502398","display_name":null,"funder_award_id":"2025A1515012281","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G840937704","display_name":null,"funder_award_id":"61971004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1885185971","https://openalex.org/W2133665775","https://openalex.org/W2209359034","https://openalex.org/W2214802144","https://openalex.org/W2242218935","https://openalex.org/W2476548250","https://openalex.org/W2866634454","https://openalex.org/W2883996939","https://openalex.org/W2887695188","https://openalex.org/W2919046835","https://openalex.org/W2950689937","https://openalex.org/W2952773607","https://openalex.org/W2963372104","https://openalex.org/W2963470893","https://openalex.org/W2963583792","https://openalex.org/W2963676087","https://openalex.org/W2963743395","https://openalex.org/W2963814095","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2964060609","https://openalex.org/W2964313012","https://openalex.org/W2966792645","https://openalex.org/W3005460778","https://openalex.org/W3013170474","https://openalex.org/W3033835243","https://openalex.org/W3035022492","https://openalex.org/W3035067471","https://openalex.org/W3035316078","https://openalex.org/W3035557850","https://openalex.org/W3035605421","https://openalex.org/W3035661604","https://openalex.org/W3110726019","https://openalex.org/W3167297682","https://openalex.org/W3173435145","https://openalex.org/W3180391059","https://openalex.org/W3189480530","https://openalex.org/W3193508667","https://openalex.org/W3216156094","https://openalex.org/W4304091752","https://openalex.org/W4312438583","https://openalex.org/W4312502087","https://openalex.org/W4312651322","https://openalex.org/W4312931308","https://openalex.org/W4312933868","https://openalex.org/W4312977351","https://openalex.org/W4367721896","https://openalex.org/W4378573568","https://openalex.org/W4386065752","https://openalex.org/W4387449209","https://openalex.org/W4387969466","https://openalex.org/W4390872856","https://openalex.org/W4390873054","https://openalex.org/W4391884092","https://openalex.org/W4392607678","https://openalex.org/W4392824670","https://openalex.org/W4393148714","https://openalex.org/W4402727836","https://openalex.org/W4402781400","https://openalex.org/W4403947068"],"related_works":[],"abstract_inverted_index":{"Convolutional":[0],"Neural":[1],"Networks":[2],"(CNNs)":[3],"have":[4],"significantly":[5],"advanced":[6],"Image":[7],"Super-Resolution":[8],"(SR),":[9],"yet":[10],"most":[11],"CNN-based":[12],"methods":[13],"rely":[14],"solely":[15],"on":[16],"pixel-based":[17],"transformations,":[18],"often":[19],"leading":[20],"to":[21,45,99,141],"artifacts":[22],"and":[23,84,118,130,158,170],"blurring,":[24],"particularly":[25],"under":[26],"severe":[27],"downsampling":[28],"rates":[29],"(<italic":[30],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[31],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">e.g.</i>,":[32],"8\u00d7":[33],"or":[34],"16\u00d7).":[35],"The":[36,113],"recently":[37],"developed":[38],"text-guided":[39],"SR":[40,98],"approaches":[41],"leverage":[42],"textual":[43,75,182],"descriptions":[44],"enhance":[46],"their":[47],"detail":[48,85],"restoration":[49],"capabilities":[50],"but":[51],"frequently":[52],"struggle":[53],"with":[54,77,106,147,155],"effectively":[55,80],"performing":[56],"alignment,":[57],"resulting":[58],"in":[59,87],"semantic":[60,70,82,160,198],"inconsistencies.":[61],"To":[62],"address":[63],"these":[64],"challenges,":[65],"we":[66],"propose":[67],"a":[68,107,143,187],"multi-modal":[69],"enhancement":[71,145],"framework":[72,114],"that":[73],"integrates":[74,115],"semantics":[76],"visual":[78],"features,":[79],"mitigating":[81],"mismatches":[83],"losses":[86],"highly":[88],"degraded":[89],"low-resolution":[90],"(LR)":[91],"images.":[92],"Our":[93],"method":[94,185],"enables":[95],"realistic,":[96],"high-quality":[97],"be":[100],"performed":[101],"at":[102,163],"large":[103],"upscaling":[104],"factors,":[105],"maximum":[108],"scaling":[109,165],"ratio":[110],"of":[111,176,189],"16\u00d7.":[112],"both":[116],"text":[117],"image":[119],"inputs":[120],"using":[121],"the":[122,125,131,174],"prompt":[123],"predictor,":[124],"Text-Image":[126],"Fusion":[127],"Block":[128],"(TIFBlock),":[129],"Iterative":[132],"Refinement":[133],"Module,":[134],"leveraging":[135,181],"Contrastive":[136],"Language-Image":[137],"Pretraining":[138],"(CLIP)":[139],"features":[140],"guide":[142],"progressive":[144],"process":[146],"fine-grained":[148],"alignment.":[149],"This":[150],"synergy":[151],"produces":[152],"high-resolution":[153],"outputs":[154],"sharp":[156],"textures":[157],"strong":[159],"coherence,":[161],"even":[162],"substantial":[164],"factors.":[166],"Extensive":[167],"comparative":[168],"experiments":[169],"ablation":[171],"studies":[172],"validate":[173],"effectiveness":[175],"our":[177,184],"approach.":[178],"Furthermore,":[179],"by":[180],"semantics,":[183],"offers":[186],"degree":[188],"super-resolution":[190],"editability,":[191],"allowing":[192],"for":[193],"controlled":[194],"enhancements":[195],"while":[196],"preserving":[197],"consistency.":[199]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
