{"id":"https://openalex.org/W7125903471","doi":"https://doi.org/10.1145/3774934.3786418","title":"ParDiff: Efficiently Parallelizing Reverse-Mode Automatic Differentiation with Direct Indexing","display_name":"ParDiff: Efficiently Parallelizing Reverse-Mode Automatic Differentiation with Direct Indexing","publication_year":2026,"publication_date":"2026-01-28","ids":{"openalex":"https://openalex.org/W7125903471","doi":"https://doi.org/10.1145/3774934.3786418"},"language":null,"primary_location":{"id":"doi:10.1145/3774934.3786418","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3774934.3786418","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124067592","display_name":"Shuhong Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuhong Huang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-9442-7375","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023681514","display_name":"Shizhi Tang","orcid":"https://orcid.org/0000-0002-6543-0859"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shizhi Tang","raw_affiliation_strings":["Qingcheng.AI, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6543-0859","affiliations":[{"raw_affiliation_string":"Qingcheng.AI, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048534698","display_name":"Yuan Wen","orcid":"https://orcid.org/0000-0002-6747-947X"},"institutions":[{"id":"https://openalex.org/I195460627","display_name":"University of Aberdeen","ror":"https://ror.org/016476m91","country_code":"GB","type":"education","lineage":["https://openalex.org/I195460627"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yuan Wen","raw_affiliation_strings":["University of Aberdeen, Aberdeen, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-6747-947X","affiliations":[{"raw_affiliation_string":"University of Aberdeen, Aberdeen, United Kingdom","institution_ids":["https://openalex.org/I195460627"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Huanqi Cao","orcid":"https://orcid.org/0000-0002-3092-1578"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huanqi Cao","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3092-1578","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090119683","display_name":"Rui Tang","orcid":"https://orcid.org/0009-0003-5935-4217"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruibai Tang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0003-5935-4217","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yidong Chen","orcid":"https://orcid.org/0000-0001-6207-5049"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yidong Chen","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6207-5049","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055665761","display_name":"Jiping Yu","orcid":"https://orcid.org/0000-0002-6643-4405"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiping Yu","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6643-4405","affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124097264","display_name":"Yang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156165","display_name":"Lenovo (China)","ror":"https://ror.org/04srd9d93","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210156165"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Li","raw_affiliation_strings":["Lenovo Research, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Lenovo Research, China","institution_ids":["https://openalex.org/I4210156165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089216253","display_name":"Chao Jiang","orcid":"https://orcid.org/0000-0001-5421-9671"},"institutions":[{"id":"https://openalex.org/I4210156165","display_name":"Lenovo (China)","ror":"https://ror.org/04srd9d93","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210156165"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Jiang","raw_affiliation_strings":["Lenovo Research, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Lenovo Research, China","institution_ids":["https://openalex.org/I4210156165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067847276","display_name":"Limin Xiao","orcid":"https://orcid.org/0000-0002-5076-8208"},"institutions":[{"id":"https://openalex.org/I4210156165","display_name":"Lenovo (China)","ror":"https://ror.org/04srd9d93","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210156165"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Limin Xiao","raw_affiliation_strings":["Lenovo Research, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Lenovo Research, China","institution_ids":["https://openalex.org/I4210156165"]}]},{"author_position":"last","author":{"id":null,"display_name":"Jidong Zhai","orcid":"https://orcid.org/0000-0002-7656-6428"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jidong Zhai","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":"https://orcid.org/0000-0002-7656-6428","affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5124067592"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12658859,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"452","last_page":"465"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9147999882698059,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9147999882698059,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.01759999990463257,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.017000000923871994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-differentiation","display_name":"Automatic differentiation","score":0.7412999868392944},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.7075999975204468},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6672999858856201},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6172000169754028},{"id":"https://openalex.org/keywords/restructuring","display_name":"Restructuring","score":0.5357000231742859},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5054000020027161},{"id":"https://openalex.org/keywords/variable","display_name":"Variable (mathematics)","score":0.4706999957561493},{"id":"https://openalex.org/keywords/chain","display_name":"Chain (unit)","score":0.36309999227523804}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8069999814033508},{"id":"https://openalex.org/C133512626","wikidata":"https://www.wikidata.org/wiki/Q787371","display_name":"Automatic differentiation","level":3,"score":0.7412999868392944},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.7075999975204468},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6672999858856201},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6172000169754028},{"id":"https://openalex.org/C45237549","wikidata":"https://www.wikidata.org/wiki/Q1376796","display_name":"Restructuring","level":2,"score":0.5357000231742859},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4900999963283539},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.4706999957561493},{"id":"https://openalex.org/C199185054","wikidata":"https://www.wikidata.org/wiki/Q552299","display_name":"Chain (unit)","level":2,"score":0.36309999227523804},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.36230000853538513},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3303000032901764},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3174999952316284},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.31380000710487366},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.3124000132083893},{"id":"https://openalex.org/C2988963302","wikidata":"https://www.wikidata.org/wiki/Q629206","display_name":"Program code","level":2,"score":0.30469998717308044},{"id":"https://openalex.org/C155386361","wikidata":"https://www.wikidata.org/wiki/Q1649571","display_name":"Process control","level":3,"score":0.2992999851703644},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2937000095844269},{"id":"https://openalex.org/C93058836","wikidata":"https://www.wikidata.org/wiki/Q1453572","display_name":"Chain code","level":3,"score":0.2800000011920929},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3774934.3786418","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3774934.3786418","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM SIGPLAN Annual Symposium on Principles and Practice of Parallel Programming","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W192546733","https://openalex.org/W199058730","https://openalex.org/W1965256357","https://openalex.org/W1967134278","https://openalex.org/W2031070741","https://openalex.org/W2071746250","https://openalex.org/W2098688018","https://openalex.org/W2148008896","https://openalex.org/W2318529993","https://openalex.org/W2387022868","https://openalex.org/W2522802439","https://openalex.org/W2718955078","https://openalex.org/W2724948248","https://openalex.org/W2791901282","https://openalex.org/W2793476006","https://openalex.org/W2810610794","https://openalex.org/W2990173985","https://openalex.org/W3035917376","https://openalex.org/W3195241200","https://openalex.org/W3210510236","https://openalex.org/W3211257750","https://openalex.org/W3214712237","https://openalex.org/W4221146591","https://openalex.org/W4281710230","https://openalex.org/W4310744122","https://openalex.org/W4321636553"],"related_works":[],"abstract_inverted_index":{"Automatic":[0],"Differentiation":[1],"(AD)":[2],"is":[3],"a":[4,20,38],"technique":[5],"that":[6],"computes":[7],"the":[8,16,43,56,79],"derivatives":[9],"of":[10],"numerical":[11],"programs":[12,36],"by":[13],"systematically":[14],"applying":[15],"chain":[17],"rule,":[18],"playing":[19],"critical":[21],"role":[22],"in":[23],"domains":[24],"such":[25],"as":[26],"machine":[27],"learning,":[28],"simulation,":[29],"and":[30,54,70],"control":[31,81],"systems.":[32],"However,":[33],"parallelizing":[34],"differentiated":[35],"remains":[37],"significant":[39],"challenge":[40],"due":[41],"to":[42,87],"conflict":[44],"between":[45],"tapes":[46],"(a":[47],"data":[48,76],"structure":[49],"for":[50],"intermediate":[51],"variable":[52],"storage)":[53],"summations:":[55],"differentiation":[57],"process":[58],"inherently":[59],"introduces":[60],"inter-thread":[61],"summation":[62],"patterns,":[63],"which":[64],"require":[65],"prohibitively":[66],"expensive":[67],"atomic":[68],"operations;":[69],"traditional":[71],"tape":[72],"designs":[73],"tightly":[74],"couple":[75],"retrieval":[77],"with":[78],"program\u2019s":[80],"flow,":[82],"preventing":[83],"code":[84],"restructuring":[85],"needed":[86],"eliminate":[88],"these":[89],"costly":[90],"dependencies.":[91]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-29T00:00:00"}
