{"id":"https://openalex.org/W4379261329","doi":"https://doi.org/10.48550/arxiv.2306.00980","title":"SnapFusion: Text-to-Image Diffusion Model on Mobile Devices within Two Seconds","display_name":"SnapFusion: Text-to-Image Diffusion Model on Mobile Devices within Two Seconds","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4379261329","doi":"https://doi.org/10.48550/arxiv.2306.00980"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.00980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.00980","pdf_url":"https://arxiv.org/pdf/2306.00980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.00980","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010773732","display_name":"Yanyu Li","orcid":"https://orcid.org/0000-0003-1240-4785"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yanyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100331980","display_name":"Huan Wang","orcid":"https://orcid.org/0000-0001-6951-901X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Huan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030977862","display_name":"Qing Jin","orcid":"https://orcid.org/0000-0001-8795-9297"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Qing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101001123","display_name":"Hu Ju","orcid":"https://orcid.org/0009-0006-1260-9931"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Ju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024781798","display_name":"Pavlo Chemerys","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chemerys, Pavlo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005819096","display_name":"Yun Fu","orcid":"https://orcid.org/0000-0002-5098-2853"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Yun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100651384","display_name":"Yanzhi Wang","orcid":"https://orcid.org/0000-0002-3024-7990"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yanzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058028206","display_name":"Sergey Tulyakov","orcid":"https://orcid.org/0000-0003-3465-1592"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tulyakov, Sergey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5023189335","display_name":"Jian Ren","orcid":"https://orcid.org/0000-0002-1889-5661"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8945000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8945000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.7888000011444092,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8124892711639404},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5813650488853455},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5742413401603699},{"id":"https://openalex.org/keywords/mobile-device","display_name":"Mobile device","score":0.5218257308006287},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.5163030028343201},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.4886832535266876},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.4622608721256256},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.42771488428115845},{"id":"https://openalex.org/keywords/anisotropic-diffusion","display_name":"Anisotropic diffusion","score":0.4214032292366028},{"id":"https://openalex.org/keywords/deconvolution","display_name":"Deconvolution","score":0.4179912209510803},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39698922634124756},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.34401506185531616},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2958911061286926}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8124892711639404},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5813650488853455},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5742413401603699},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.5218257308006287},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.5163030028343201},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.4886832535266876},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.4622608721256256},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.42771488428115845},{"id":"https://openalex.org/C203504353","wikidata":"https://www.wikidata.org/wiki/Q4765461","display_name":"Anisotropic diffusion","level":3,"score":0.4214032292366028},{"id":"https://openalex.org/C174576160","wikidata":"https://www.wikidata.org/wiki/Q1183700","display_name":"Deconvolution","level":2,"score":0.4179912209510803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39698922634124756},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.34401506185531616},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2958911061286926},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.00980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.00980","pdf_url":"https://arxiv.org/pdf/2306.00980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.00980","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.00980","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.00980","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.00980","pdf_url":"https://arxiv.org/pdf/2306.00980","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3090782779","https://openalex.org/W4251527294","https://openalex.org/W2562325497","https://openalex.org/W2149396808","https://openalex.org/W2475096862","https://openalex.org/W2379232376","https://openalex.org/W3209466624","https://openalex.org/W1992788508","https://openalex.org/W2071165097","https://openalex.org/W2007919187"],"abstract_inverted_index":{"Text-to-image":[0],"diffusion":[1,54,92,190],"models":[2,22,55,93,191],"can":[3],"create":[4],"stunning":[5],"images":[6],"from":[7,152],"natural":[8],"language":[9],"descriptions":[10],"that":[11,161],"rival":[12],"the":[13,86,122,125,130,133,142,193],"work":[14,182],"of":[15,31,124,132,195],"professional":[16],"artists":[17],"and":[18,29,38,47,61,110,128,149,171],"photographers.":[19],"However,":[20],"these":[21,77],"are":[23,50],"large,":[24],"with":[25,164,178],"complex":[26],"network":[27,108],"architectures":[28],"tens":[30],"denoising":[32,166],"iterations,":[33],"making":[34],"them":[35],"computationally":[36],"expensive":[37],"slow":[39],"to":[40,52,71,192],"run.":[41],"As":[42],"a":[43,72,81],"result,":[44],"high-end":[45],"GPUs":[46],"cloud-based":[48],"inference":[49],"required":[51],"run":[53],"at":[56],"scale.":[57],"This":[58],"is":[59,69],"costly":[60],"has":[62],"privacy":[63],"implications,":[64],"especially":[65],"when":[66],"user":[67],"data":[68,137],"sent":[70],"third":[73],"party.":[74],"To":[75],"overcome":[76],"challenges,":[78],"we":[79,115,140],"present":[80],"generic":[82],"approach":[83],"that,":[84],"for":[85],"first":[87],"time,":[88],"unlocks":[89],"running":[90],"text-to-image":[91,189],"on":[94,158],"mobile":[95],"devices":[96],"in":[97],"less":[98],"than":[99,174],"$2$":[100],"seconds.":[101],"We":[102],"achieve":[103],"so":[104],"by":[105,120,145,186],"introducing":[106,150],"efficient":[107,118],"architecture":[109],"improving":[111],"step":[112,143],"distillation.":[113,138],"Specifically,":[114],"propose":[116],"an":[117],"UNet":[119],"identifying":[121],"redundancy":[123],"original":[126],"model":[127,163],"reducing":[129],"computation":[131],"image":[134],"decoder":[135],"via":[136],"Further,":[139],"enhance":[141],"distillation":[144],"exploring":[146],"training":[147],"strategies":[148],"regularization":[151],"classifier-free":[153],"guidance.":[154],"Our":[155,181],"extensive":[156],"experiments":[157],"MS-COCO":[159],"show":[160],"our":[162],"$8$":[165],"steps":[167],"achieves":[168],"better":[169],"FID":[170],"CLIP":[172],"scores":[173],"Stable":[175],"Diffusion":[176],"v$1.5$":[177],"$50$":[179],"steps.":[180],"democratizes":[183],"content":[184],"creation":[185],"bringing":[187],"powerful":[188],"hands":[194],"users.":[196]},"counts_by_year":[{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":21},{"year":2023,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2023-06-04T00:00:00"}
