{"id":"https://openalex.org/W4400374120","doi":"https://doi.org/10.48550/arxiv.2407.02158","title":"UltraPixel: Advancing Ultra-High-Resolution Image Synthesis to New Peaks","display_name":"UltraPixel: Advancing Ultra-High-Resolution Image Synthesis to New Peaks","publication_year":2024,"publication_date":"2024-07-02","ids":{"openalex":"https://openalex.org/W4400374120","doi":"https://doi.org/10.48550/arxiv.2407.02158"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2407.02158","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.02158","pdf_url":"https://arxiv.org/pdf/2407.02158","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2407.02158","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051565381","display_name":"Jingjing Ren","orcid":"https://orcid.org/0000-0002-6427-4364"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ren, Jingjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100336572","display_name":"Wenbo Li","orcid":"https://orcid.org/0000-0002-0464-6955"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Wenbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100763969","display_name":"Haoyu Chen","orcid":"https://orcid.org/0000-0001-7618-9733"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Haoyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102960782","display_name":"Renjing Pei","orcid":"https://orcid.org/0000-0001-7513-6576"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pei, Renjing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101518423","display_name":"Bin Shao","orcid":"https://orcid.org/0009-0000-2270-3258"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102890595","display_name":"Yong Guo","orcid":"https://orcid.org/0000-0002-2599-6970"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022583092","display_name":"Long Peng","orcid":"https://orcid.org/0000-0001-9654-953X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Long","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111938544","display_name":"Fenglong Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Fenglong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101342017","display_name":"Lei Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Lei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5051565381"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9732999801635742,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9732999801635742,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12923","display_name":"Digital Image Processing Techniques","score":0.946399986743927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.502507209777832},{"id":"https://openalex.org/keywords/high-resolution","display_name":"High resolution","score":0.4503065049648285},{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.4223792254924774},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3566203713417053},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.28136956691741943},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26892250776290894},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.19494473934173584},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.18283849954605103}],"concepts":[{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.502507209777832},{"id":"https://openalex.org/C3020199158","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"High resolution","level":2,"score":0.4503065049648285},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.4223792254924774},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3566203713417053},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.28136956691741943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26892250776290894},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.19494473934173584},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.18283849954605103}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2407.02158","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.02158","pdf_url":"https://arxiv.org/pdf/2407.02158","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-159751","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-159751","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"},{"id":"doi:10.48550/arxiv.2407.02158","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2407.02158","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2407.02158","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.02158","pdf_url":"https://arxiv.org/pdf/2407.02158","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4212954839","https://openalex.org/W2056165575","https://openalex.org/W3190051883"],"abstract_inverted_index":{"Ultra-high-resolution":[0],"image":[1],"generation":[2,66],"poses":[3],"great":[4],"challenges,":[5],"such":[6],"as":[7],"increased":[8],"semantic":[9],"planning":[10],"complexity":[11],"and":[12,84,95,122,138],"detail":[13],"synthesis":[14],"difficulties,":[15],"alongside":[16],"substantial":[17],"training":[18,121,129],"resource":[19],"demands.":[20],"We":[21],"present":[22],"UltraPixel,":[23],"a":[24,43],"novel":[25],"architecture":[26],"utilizing":[27],"cascade":[28],"diffusion":[29],"models":[30],"to":[31,40,62,89],"generate":[32],"high-quality":[33],"images":[34,56,137],"at":[35],"multiple":[36],"resolutions":[37],"(\\textit{e.g.},":[38],"1K":[39],"6K)":[41],"within":[42],"single":[44],"model,":[45],"while":[46],"maintaining":[47],"computational":[48],"efficiency.":[49,124],"UltraPixel":[50],"leverages":[51],"semantics-rich":[52],"representations":[53,80],"of":[54,67,108],"lower-resolution":[55],"in":[57,100,142],"the":[58,64,101,106],"later":[59],"denoising":[60],"stage":[61],"guide":[63],"whole":[65],"highly":[68],"detailed":[69],"high-resolution":[70,96,117,136],"images,":[71],"significantly":[72],"reducing":[73],"complexity.":[74],"Furthermore,":[75],"we":[76],"introduce":[77],"implicit":[78],"neural":[79],"for":[81,116],"continuous":[82],"upsampling":[83],"scale-aware":[85],"normalization":[86],"layers":[87],"adaptable":[88],"various":[90],"resolutions.":[91],"Notably,":[92],"both":[93],"low-":[94],"processes":[97],"are":[98],"performed":[99],"most":[102],"compact":[103],"space,":[104],"sharing":[105],"majority":[107],"parameters":[109,115],"with":[110,130],"less":[111],"than":[112],"3$\\%$":[113],"additional":[114],"outputs,":[118],"largely":[119],"enhancing":[120],"inference":[123],"Our":[125],"model":[126],"achieves":[127],"fast":[128],"reduced":[131],"data":[132],"requirements,":[133],"producing":[134],"photo-realistic":[135],"demonstrating":[139],"state-of-the-art":[140],"performance":[141],"extensive":[143],"experiments.":[144]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
