{"id":"https://openalex.org/W4405033876","doi":"https://doi.org/10.48550/arxiv.2412.00878","title":"Beyond Pixels: Text Enhances Generalization in Real-World Image Restoration","display_name":"Beyond Pixels: Text Enhances Generalization in Real-World Image Restoration","publication_year":2024,"publication_date":"2024-12-01","ids":{"openalex":"https://openalex.org/W4405033876","doi":"https://doi.org/10.48550/arxiv.2412.00878"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2412.00878","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.00878","pdf_url":"https://arxiv.org/pdf/2412.00878","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2412.00878","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102777251","display_name":"Haoze Sun","orcid":"https://orcid.org/0000-0002-7037-701X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sun, Haoze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100336571","display_name":"Wenbo Li","orcid":"https://orcid.org/0000-0002-0199-1534"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Wenbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101829530","display_name":"Jiayue Liu","orcid":"https://orcid.org/0000-0001-9294-7493"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiayue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001993403","display_name":"Kaiwen Zhou","orcid":"https://orcid.org/0000-0002-1943-0612"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Kaiwen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100611588","display_name":"Yongqiang Chen","orcid":"https://orcid.org/0000-0002-7578-3017"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yongqiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100754016","display_name":"Yong\u2010Xin Guo","orcid":"https://orcid.org/0000-0001-8842-5609"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047385098","display_name":"Yan-Wei Li","orcid":"https://orcid.org/0000-0001-9011-3786"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yanwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102960782","display_name":"Renjing Pei","orcid":"https://orcid.org/0000-0001-7513-6576"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pei, Renjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021093477","display_name":"Long Peng","orcid":"https://orcid.org/0000-0003-4589-8064"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Long","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020953714","display_name":"Yujiu Yang","orcid":"https://orcid.org/0000-0002-6427-1024"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yujiu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5102777251"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.8001999855041504,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.8001999855041504,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.7730000019073486,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.7426000237464905,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7355743050575256},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.6101014614105225},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.603969931602478},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.473811537027359},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4657040238380432},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.46151942014694214},{"id":"https://openalex.org/keywords/image-restoration","display_name":"Image restoration","score":0.460345059633255},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2787776589393616},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.1884405016899109},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.05208173394203186}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7355743050575256},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.6101014614105225},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.603969931602478},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.473811537027359},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4657040238380432},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46151942014694214},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.460345059633255},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2787776589393616},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.1884405016899109},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.05208173394203186}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2412.00878","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.00878","pdf_url":"https://arxiv.org/pdf/2412.00878","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2412.00878","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2412.00878","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2412.00878","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.00878","pdf_url":"https://arxiv.org/pdf/2412.00878","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4405033876.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3162204513","https://openalex.org/W3135697610","https://openalex.org/W2371138613","https://openalex.org/W2085033728","https://openalex.org/W4285411112","https://openalex.org/W2048963458","https://openalex.org/W1598401975","https://openalex.org/W2974904990","https://openalex.org/W2365681766","https://openalex.org/W2393963626"],"abstract_inverted_index":{"Generalization":[0],"has":[1],"long":[2],"been":[3],"a":[4,91,113],"central":[5],"challenge":[6],"in":[7,26],"real-world":[8,41,120],"image":[9,100],"restoration.":[10],"While":[11],"recent":[12],"diffusion-based":[13,133],"restoration":[14,134],"methods,":[15],"which":[16],"leverage":[17],"generative":[18,58],"priors":[19],"from":[20],"text-to-image":[21],"models,":[22,135],"have":[23],"made":[24],"progress":[25],"recovering":[27],"more":[28],"realistic":[29],"details,":[30],"they":[31],"still":[32],"encounter":[33],"\"generative":[34],"capability":[35],"deactivation\"":[36],"when":[37],"applied":[38],"to":[39,55,99,117],"out-of-distribution":[40],"data.":[42],"To":[43],"address":[44],"this,":[45],"we":[46,88,110],"propose":[47],"using":[48],"text":[49,71],"as":[50],"an":[51],"auxiliary":[52],"invariant":[53],"representation":[54],"reactivate":[56],"the":[57,129],"capabilities":[59],"of":[60,70,132],"these":[61,86],"models.":[62],"We":[63],"begin":[64],"by":[65],"identifying":[66],"two":[67],"key":[68],"properties":[69],"input:":[72],"richness":[73],"and":[74,76,102],"relevance,":[75],"examine":[77],"their":[78],"respective":[79],"influence":[80],"on":[81,85],"model":[82],"performance.":[83],"Building":[84],"insights,":[87],"introduce":[89],"Res-Captioner,":[90],"module":[92],"that":[93,125],"generates":[94],"enhanced":[95],"textual":[96],"descriptions":[97],"tailored":[98],"content":[101],"degradation":[103],"levels,":[104],"effectively":[105],"mitigating":[106],"response":[107],"failures.":[108],"Additionally,":[109],"present":[111],"RealIR,":[112],"new":[114],"benchmark":[115],"designed":[116],"capture":[118],"diverse":[119],"scenarios.":[121],"Extensive":[122],"experiments":[123],"demonstrate":[124],"Res-Captioner":[126],"significantly":[127],"enhances":[128],"generalization":[130],"abilities":[131],"while":[136],"remaining":[137],"fully":[138],"plug-and-play.":[139]},"counts_by_year":[],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2024-12-05T00:00:00"}
