{"id":"https://openalex.org/W7162698496","doi":"https://doi.org/10.48550/arxiv.2605.28426","title":"Fault Tolerance of Accelerated Asynchronous Fixed-Point Iterations on Flexible Computing Infrastructure","display_name":"Fault Tolerance of Accelerated Asynchronous Fixed-Point Iterations on Flexible Computing Infrastructure","publication_year":2026,"publication_date":"2026-05-27","ids":{"openalex":"https://openalex.org/W7162698496","doi":"https://doi.org/10.48550/arxiv.2605.28426"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.28426","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.28426","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.28426","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125717016","display_name":"Evan Coleman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Coleman, Evan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5090093092","display_name":"Masha Sosonkina","orcid":"https://orcid.org/0009-0005-0223-397X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sosonkina, Masha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.7251999974250793,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.7251999974250793,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.08789999783039093,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.05889999866485596,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.9180999994277954},{"id":"https://openalex.org/keywords/synchronizer","display_name":"Synchronizer","score":0.6858000159263611},{"id":"https://openalex.org/keywords/asynchrony","display_name":"Asynchrony (computer programming)","score":0.6309000253677368},{"id":"https://openalex.org/keywords/iterated-function","display_name":"Iterated function","score":0.6226999759674072},{"id":"https://openalex.org/keywords/fault-tolerance","display_name":"Fault tolerance","score":0.5641000270843506},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.5260999798774719},{"id":"https://openalex.org/keywords/perturbation","display_name":"Perturbation (astronomy)","score":0.5217999815940857},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.4999000132083893},{"id":"https://openalex.org/keywords/smoothness","display_name":"Smoothness","score":0.4156999886035919}],"concepts":[{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.9180999994277954},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7538999915122986},{"id":"https://openalex.org/C66727535","wikidata":"https://www.wikidata.org/wiki/Q7662199","display_name":"Synchronizer","level":2,"score":0.6858000159263611},{"id":"https://openalex.org/C2779019669","wikidata":"https://www.wikidata.org/wiki/Q25203946","display_name":"Asynchrony (computer programming)","level":3,"score":0.6309000253677368},{"id":"https://openalex.org/C140479938","wikidata":"https://www.wikidata.org/wiki/Q5254619","display_name":"Iterated function","level":2,"score":0.6226999759674072},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.5641000270843506},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.5260999798774719},{"id":"https://openalex.org/C177918212","wikidata":"https://www.wikidata.org/wiki/Q803623","display_name":"Perturbation (astronomy)","level":2,"score":0.5217999815940857},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.4999000132083893},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4311000108718872},{"id":"https://openalex.org/C102634674","wikidata":"https://www.wikidata.org/wiki/Q868473","display_name":"Smoothness","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.400299996137619},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.37459999322891235},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3709000051021576},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.33410000801086426},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.3271999955177307},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.3100000023841858},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.2890999913215637},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.28380000591278076},{"id":"https://openalex.org/C163415756","wikidata":"https://www.wikidata.org/wiki/Q126473","display_name":"Contraction (grammar)","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C191795146","wikidata":"https://www.wikidata.org/wiki/Q3878446","display_name":"Norm (philosophy)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2694999873638153},{"id":"https://openalex.org/C118437007","wikidata":"https://www.wikidata.org/wiki/Q1017139","display_name":"Hybrid automatic repeat request","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C183469790","wikidata":"https://www.wikidata.org/wiki/Q333501","display_name":"Crash","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.25619998574256897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.28426","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.28426","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.28426","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.28426","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.723878800868988,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Asynchronous":[0],"iterative":[1],"methods":[2],"tolerate":[3],"straggling":[4],"processors":[5],"by":[6],"allowing":[7],"workers":[8],"to":[9,172],"proceed":[10],"with":[11,88,117,198],"stale":[12,148],"data,":[13],"but":[14,190],"at":[15],"a":[16,69,118,169],"cost:":[17],"the":[18,44,54,58,76,138,155,173,187,195,199,211,217,220],"iterates":[19],"become":[20],"inconsistent,":[21],"potentially":[22],"degrading":[23],"convergence.":[24],"We":[25,38,91,140],"investigate":[26],"whether":[27,123,224],"convergence":[28],"accelerators":[29],"such":[30],"as":[31,168],"Anderson":[32,128,182],"acceleration":[33,124,183,225],"compensate":[34],"for":[35,47,53],"this":[36],"degradation.":[37],"experimentally":[39],"study":[40],"three":[41],"fixed-point":[42,174],"iterations:":[43],"Jacobi":[45],"method":[46],"sparse":[48],"linear":[49],"systems,":[50],"value":[51],"iteration":[52],"Bellman":[55],"equation,":[56],"and":[57,81,85,111,162,180],"Hartree--Fock":[59],"self-consistent":[60],"field":[61],"(SCF)":[62,113],"iteration.":[63],"The":[64],"experiments":[65],"are":[66],"conducted":[67],"using":[68],"high-performance":[70],"execution":[71,102,116],"framework":[72],"Ray,":[73],"which":[74],"abstracts":[75],"complexity":[77],"of":[78,106,122,154,202,216,223],"distributed":[79],"systems":[80],"enables":[82],"code":[83],"parallelization":[84],"fault":[86],"injection":[87],"minimal":[89],"changes.":[90],"establish":[92],"two":[93,142],"main":[94],"results.":[95],"First,":[96],"straggler":[97],"tolerance":[98],"is":[99,125,219],"universal:":[100],"asynchronous":[101,227],"provides":[103],"wall-clock":[104],"speedups":[105],"$2.9\\times$":[107],"(Jacobi),":[108],"$7.7\\times$":[109],"(VI),":[110],"$16.9\\times$":[112],"over":[114],"synchronous":[115],"100\\,ms-delayed":[119],"worker,":[120],"independent":[121],"used.":[126],"Second,":[127],"acceleration's":[129],"effectiveness":[130],"under":[131,186,194],"asynchrony":[132],"depends":[133],"on":[134],"where":[135,147,165],"staleness":[136,143,166],"enters":[137],"computation.":[139],"identify":[141],"mechanisms:":[144],"iterate-level":[145],"corruption,":[146],"worker":[149],"returns":[150],"directly":[151],"overwrite":[152],"portions":[153],"accelerated":[156],"iterate":[157],"(as":[158,177],"in":[159,178],"block":[160],"Jacobi),":[161],"evaluation-level":[163],"perturbation,":[164],"acts":[167],"bounded":[170],"perturbation":[171,200],"map":[175],"evaluation":[176],"VI":[179],"SCF).":[181],"fails":[184],"categorically":[185],"first":[188],"mechanism":[189],"retains":[191],"its":[192],"benefits":[193],"second,":[196],"consistent":[197],"analysis":[201],"Toth":[203],"et":[204],"al.\\":[205],"(2017).":[206],"This":[207],"distinction,":[208],"rather":[209],"than":[210],"contraction":[212],"norm":[213],"or":[214],"smoothness":[215],"map,":[218],"primary":[221],"determinant":[222],"survives":[226],"execution.":[228]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-29T00:00:00"}
