{"id":"https://openalex.org/W7117120983","doi":"https://doi.org/10.1109/tpami.2025.3647857","title":"You Only Look One Step: Accelerating Backpropagation in Diffusion Sampling With Gradient Shortcuts","display_name":"You Only Look One Step: Accelerating Backpropagation in Diffusion Sampling With Gradient Shortcuts","publication_year":2025,"publication_date":"2025-12-24","ids":{"openalex":"https://openalex.org/W7117120983","doi":"https://doi.org/10.1109/tpami.2025.3647857","pmid":"https://pubmed.ncbi.nlm.nih.gov/41442305"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3647857","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3647857","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032456103","display_name":"Hongkun Dou","orcid":"https://orcid.org/0000-0001-6185-5369"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongkun Dou","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6185-5369","affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zeyu Li","orcid":"https://orcid.org/0000-0002-8693-0334"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zeyu Li","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8693-0334","affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xingyu Jiang","orcid":"https://orcid.org/0009-0006-0282-622X"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingyu Jiang","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-0282-622X","affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121182849","display_name":"Hongjue Li","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongjue Li","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0504-2555","affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121234073","display_name":"Lijun Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lijun Yang","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121234969","display_name":"Wen Yao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210160531","display_name":"Chinese People's Liberation Army","ror":"https://ror.org/05tf9r976","country_code":"CN","type":"funder","lineage":["https://openalex.org/I4210160531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Yao","raw_affiliation_strings":["Defense Innovation Institute, Chinese Academy of Military Science, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-5224-9834","affiliations":[{"raw_affiliation_string":"Defense Innovation Institute, Chinese Academy of Military Science, Beijing, China","institution_ids":["https://openalex.org/I4210160531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121135020","display_name":"Yue Deng","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Deng","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2871-8922","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5032456103"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.6658609,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"48","issue":"5","first_page":"5050","last_page":"5067"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11304","display_name":"Advanced Neuroimaging Techniques and Applications","score":0.5335000157356262,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11304","display_name":"Advanced Neuroimaging Techniques and Applications","score":0.5335000157356262,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.21619999408721924,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.026799999177455902,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.8253999948501587},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5389999747276306},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.5062000155448914},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4765999913215637},{"id":"https://openalex.org/keywords/diffusion-process","display_name":"Diffusion process","score":0.4438000023365021},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43140000104904175},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4180000126361847},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4117000102996826},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.39899998903274536}],"concepts":[{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.8253999948501587},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7630000114440918},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5389999747276306},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.5062000155448914},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.47749999165534973},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4765999913215637},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.4438000023365021},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43140000104904175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41909998655319214},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4180000126361847},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4117000102996826},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.39899998903274536},{"id":"https://openalex.org/C27458966","wikidata":"https://www.wikidata.org/wiki/Q1187693","display_name":"Control flow graph","level":2,"score":0.3492000102996826},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2962000072002411},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.29429998993873596},{"id":"https://openalex.org/C115680565","wikidata":"https://www.wikidata.org/wiki/Q5977448","display_name":"Gradient method","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.29030001163482666},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2856999933719635},{"id":"https://openalex.org/C88230418","wikidata":"https://www.wikidata.org/wiki/Q131476","display_name":"Graph theory","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C133512626","wikidata":"https://www.wikidata.org/wiki/Q787371","display_name":"Automatic differentiation","level":3,"score":0.27790001034736633},{"id":"https://openalex.org/C2781395549","wikidata":"https://www.wikidata.org/wiki/Q4680762","display_name":"Adaptive sampling","level":3,"score":0.27709999680519104},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.2700999975204468},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.2646999955177307},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.26159998774528503},{"id":"https://openalex.org/C73301696","wikidata":"https://www.wikidata.org/wiki/Q5469984","display_name":"Formalism (music)","level":3,"score":0.25679999589920044},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25619998574256897},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.25450000166893005},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3647857","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3647857","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41442305","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41442305","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4613763696","display_name":null,"funder_award_id":"62031001","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G645526940","display_name":null,"funder_award_id":"62325101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6644097784","display_name":null,"funder_award_id":"62405014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0,123],"models":[1],"(DMs)":[2],"have":[3],"recently":[4],"demonstrated":[5],"remarkable":[6],"success":[7],"in":[8,53,138],"modeling":[9],"large-scale":[10],"data":[11],"distributions.":[12],"However,":[13],"many":[14],"downstream":[15,93],"tasks":[16],"require":[17],"guiding":[18],"the":[19,31,72,75,86,100,143,159],"generated":[20],"content":[21],"based":[22],"on":[23,147],"specific":[24],"differentiable":[25],"metrics,":[26],"typically":[27],"necessitating":[28],"backpropagation":[29,84],"during":[30,107],"generation":[32,88,153],"process.":[33],"This":[34],"approach":[35,170],"is":[36,90,126,182],"computationally":[37,130],"expensive,":[38],"as":[39],"generating":[40],"with":[41],"DMs":[42,160],"often":[43],"demands":[44],"tens":[45],"to":[46,166],"hundreds":[47],"of":[48,77,103,133,145],"recursive":[49],"network":[50,163],"calls,":[51],"resulting":[52,117],"high":[54],"memory":[55],"usage":[56],"and":[57,129,157],"significant":[58],"time":[59],"consumption.":[60],"In":[61],"this":[62],"paper,":[63],"we":[64,120],"propose":[65],"a":[66,111],"more":[67],"efficient":[68],"alternative":[69],"that":[70,82],"approaches":[71],"problem":[73],"from":[74],"perspective":[76],"parallel":[78],"denoising.":[79],"We":[80,141],"show":[81],"full":[83,167],"throughout":[85],"entire":[87],"process":[89],"unnecessary.":[91],"The":[92,116],"metrics":[94],"can":[95],"be":[96],"optimized":[97],"by":[98,154,161,174],"retaining":[99],"computational":[101,172],"graph":[102],"only":[104],"one":[105],"step":[106],"generation,":[108],"thus":[109],"providing":[110],"shortcut":[112],"for":[113],"gradient":[114],"propagation.":[115],"method,":[118],"which":[119],"call":[121],"Shortcut":[122],"Optimization":[124],"(SDO),":[125],"generic,":[127],"high-performance,":[128],"lightweight,":[131],"capable":[132],"optimizing":[134,155],"all":[135],"parameter":[136],"types":[137],"diffusion":[139],"sampling.":[140],"demonstrate":[142],"effectiveness":[144],"SDO":[146],"several":[148],"real-world":[149],"tasks,":[150],"including":[151],"controlling":[152],"latent":[156],"aligning":[158],"fine-tuning":[162],"parameters.":[164],"Compared":[165],"backpropagation,":[168],"our":[169],"reduces":[171],"costs":[173],"$\\sim\\!":[175],"90\\%$\u223c90%":[176],"while":[177],"maintaining":[178],"superior":[179],"performance.":[180],"Code":[181],"available":[183],"at":[184],"https://github.com/deng-ai-lab/SDO.":[185]},"counts_by_year":[],"updated_date":"2026-04-04T06:10:10.580331","created_date":"2025-12-24T00:00:00"}
