{"id":"https://openalex.org/W4407164524","doi":"https://doi.org/10.2478/jaiscr-2025-0006","title":"Accelerating Neural Network Training with FSGQR: A Scalable and High-Performance Alternative to Adam","display_name":"Accelerating Neural Network Training with FSGQR: A Scalable and High-Performance Alternative to Adam","publication_year":2025,"publication_date":"2025-02-05","ids":{"openalex":"https://openalex.org/W4407164524","doi":"https://doi.org/10.2478/jaiscr-2025-0006"},"language":"en","primary_location":{"id":"doi:10.2478/jaiscr-2025-0006","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jaiscr-2025-0006","pdf_url":"https://reference-global.com/2/v2/download/article/10.2478/jaiscr-2025-0006.pdf","source":{"id":"https://openalex.org/S4210223945","display_name":"Journal of Artificial Intelligence and Soft Computing Research","issn_l":"2083-2567","issn":["2083-2567","2449-6499"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317241","host_organization_name":"Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology","host_organization_lineage":["https://openalex.org/P4310317241"],"host_organization_lineage_names":["Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence and Soft Computing Research","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://reference-global.com/2/v2/download/article/10.2478/jaiscr-2025-0006.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068798625","display_name":"Jaros\u0142aw Bilski","orcid":"https://orcid.org/0000-0003-1769-3934"},"institutions":[{"id":"https://openalex.org/I130294970","display_name":"Cz\u0119stochowa University of Technology","ror":"https://ror.org/046awyn59","country_code":"PL","type":"education","lineage":["https://openalex.org/I130294970"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Jaros\u0142aw Bilski","raw_affiliation_strings":["Department of Artificial Intelligence , Cz\u0119stochowa University of Technology , al. Armii Krajowej 36 , Cz\u0119stochowa , Poland"],"raw_orcid":"https://orcid.org/0000-0003-1769-3934","affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence , Cz\u0119stochowa University of Technology , al. Armii Krajowej 36 , Cz\u0119stochowa , Poland","institution_ids":["https://openalex.org/I130294970"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014333787","display_name":"Bartosz Kowalczyk","orcid":"https://orcid.org/0000-0002-7683-9051"},"institutions":[{"id":"https://openalex.org/I130294970","display_name":"Cz\u0119stochowa University of Technology","ror":"https://ror.org/046awyn59","country_code":"PL","type":"education","lineage":["https://openalex.org/I130294970"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Bartosz Kowalczyk","raw_affiliation_strings":["Department of Artificial Intelligence , Cz\u0119stochowa University of Technology , al. Armii Krajowej 36 , Cz\u0119stochowa , Poland"],"raw_orcid":"https://orcid.org/0000-0002-7683-9051","affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence , Cz\u0119stochowa University of Technology , al. Armii Krajowej 36 , Cz\u0119stochowa , Poland","institution_ids":["https://openalex.org/I130294970"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091709635","display_name":"Ludmila Dymova","orcid":"https://orcid.org/0000-0002-5387-9990"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ludmila Dymova","raw_affiliation_strings":["Information Technology Institute , SAN University , , \u0141\u00f3d\u017a , Poland"],"raw_orcid":"https://orcid.org/0000-0002-5387-9990","affiliations":[{"raw_affiliation_string":"Information Technology Institute , SAN University , , \u0141\u00f3d\u017a , Poland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054421000","display_name":"Min Xiao","orcid":"https://orcid.org/0000-0002-8992-153X"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Xiao","raw_affiliation_strings":["College of Automation & College of Artificial Intelligence Nanjing University of Posts and Telecommunications Nanjing , China"],"raw_orcid":"https://orcid.org/0000-0002-8992-153X","affiliations":[{"raw_affiliation_string":"College of Automation & College of Artificial Intelligence Nanjing University of Posts and Telecommunications Nanjing , China","institution_ids":["https://openalex.org/I41198531"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5068798625"],"corresponding_institution_ids":["https://openalex.org/I130294970"],"apc_list":null,"apc_paid":null,"fwci":8.5044,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.96862686,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"15","issue":"2","first_page":"95","last_page":"113"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6133437752723694},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.609128475189209},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5300383567810059},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.48740676045417786},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3905310034751892},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.34085384011268616},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11187335848808289}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6133437752723694},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.609128475189209},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5300383567810059},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.48740676045417786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3905310034751892},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.34085384011268616},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11187335848808289},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.2478/jaiscr-2025-0006","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jaiscr-2025-0006","pdf_url":"https://reference-global.com/2/v2/download/article/10.2478/jaiscr-2025-0006.pdf","source":{"id":"https://openalex.org/S4210223945","display_name":"Journal of Artificial Intelligence and Soft Computing Research","issn_l":"2083-2567","issn":["2083-2567","2449-6499"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317241","host_organization_name":"Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology","host_organization_lineage":["https://openalex.org/P4310317241"],"host_organization_lineage_names":["Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence and Soft Computing Research","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.2478/jaiscr-2025-0006","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jaiscr-2025-0006","pdf_url":"https://reference-global.com/2/v2/download/article/10.2478/jaiscr-2025-0006.pdf","source":{"id":"https://openalex.org/S4210223945","display_name":"Journal of Artificial Intelligence and Soft Computing Research","issn_l":"2083-2567","issn":["2083-2567","2449-6499"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317241","host_organization_name":"Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology","host_organization_lineage":["https://openalex.org/P4310317241"],"host_organization_lineage_names":["Polish Neural Network Society, the University of Social Sciences in Lodz & Czestochowa University of Technology"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Artificial Intelligence and Soft Computing Research","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407164524.pdf"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W6908809","https://openalex.org/W50270055","https://openalex.org/W148691561","https://openalex.org/W190213900","https://openalex.org/W818067050","https://openalex.org/W1484259480","https://openalex.org/W1522301498","https://openalex.org/W1988720110","https://openalex.org/W2019282798","https://openalex.org/W2036050714","https://openalex.org/W2043039667","https://openalex.org/W2058663814","https://openalex.org/W2065024490","https://openalex.org/W2069232849","https://openalex.org/W2074346829","https://openalex.org/W2105050785","https://openalex.org/W2106479238","https://openalex.org/W2112796928","https://openalex.org/W2117825133","https://openalex.org/W2141801655","https://openalex.org/W2146502635","https://openalex.org/W2155482699","https://openalex.org/W2165063012","https://openalex.org/W2494386023","https://openalex.org/W2759483166","https://openalex.org/W2761561821","https://openalex.org/W2769156605","https://openalex.org/W2794029453","https://openalex.org/W2901185836","https://openalex.org/W2945464279","https://openalex.org/W2945650117","https://openalex.org/W2962949934","https://openalex.org/W3205374070","https://openalex.org/W4286722589","https://openalex.org/W4310136640","https://openalex.org/W4323928528","https://openalex.org/W4381851563","https://openalex.org/W4390191112","https://openalex.org/W4394582863","https://openalex.org/W4401094021","https://openalex.org/W6888914244","https://openalex.org/W6964248249"],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W2389214306","https://openalex.org/W3216976533","https://openalex.org/W100620283","https://openalex.org/W2965083567","https://openalex.org/W2495260952"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2,135],"introduces":[3],"a":[4,16,162,197],"significant":[5],"advancement":[6],"in":[7,21,111,129,187],"neural":[8,152,189],"network":[9,153],"training":[10,43,90,99,110,132,176],"algorithms":[11],"through":[12],"the":[13,28,69,83,120,130,141],"development":[14],"of":[15,40,50],"Fast":[17],"Scaled":[18],"Givens":[19],"rotations":[20],"QR":[22],"decomposition":[23],"(FSGQR)":[24],"method":[25],"based":[26],"on":[27],"recursive":[29],"least":[30],"squares":[31],"(RLS)":[32],"method.":[33],"The":[34,92,134,155,181],"algorithm":[35,93],"represents":[36],"an":[37],"optimized":[38],"variant":[39],"existing":[41],"rotation-based":[42],"approaches,":[44],"distinguished":[45],"by":[46],"its":[47],"complete":[48],"elimination":[49],"scale":[51],"factors":[52],"from":[53],"calculations":[54],"while":[55,101,123],"maintaining":[56,102],"mathematical":[57,138],"precision.":[58],"Through":[59],"extensive":[60,147],"experimentation":[61],"across":[62,150],"multiple":[63],"benchmarks,":[64],"including":[65],"complex":[66],"tasks":[67],"like":[68],"MNIST":[70,131],"digit":[71],"recognition":[72,127],"and":[73,87,146],"concrete":[74],"strength":[75],"prediction,":[76],"FSGQR":[77,108,160],"demonstrates":[78],"superior":[79],"performance":[80],"compared":[81,118],"to":[82,113,119,165],"widely-used":[84],"ADAM":[85,121],"optimizer":[86],"other":[88],"conventional":[89],"methods.":[91],"achieves":[94],"faster":[95],"convergence":[96,177],"with":[97,191],"fewer":[98,116],"epochs":[100,117],"or":[103],"improving":[104],"accuracy.In":[105],"some":[106],"tasks,":[107],"completed":[109],"up":[112],"five":[114],"times":[115],"algorithm,":[122],"it":[124,196],"achieved":[125],"higher":[126],"accuracy":[128],"set.":[133],"provides":[136],"comprehensive":[137],"foundations":[139],"for":[140,172,200],"optimization,":[142],"detailed":[143],"implementation":[144],"guidelines,":[145],"empirical":[148],"validation":[149],"various":[151],"architectures.":[154],"results":[156],"conclusively":[157],"demonstrate":[158],"that":[159],"offers":[161],"compelling":[163],"alternative":[164],"current":[166],"deep":[167],"learning":[168,203],"optimization":[169],"methods,":[170],"particularly":[171,185],"applications":[173],"requiring":[174],"rapid":[175],"without":[178],"sacrificing":[179],"accuracy.":[180],"algorithm\u2019s":[182],"effectiveness":[183],"is":[184],"noteworthy":[186],"feedforward":[188],"networks":[190],"differentiable":[192],"activation":[193],"functions,":[194],"making":[195],"valuable":[198],"tool":[199],"modern":[201],"machine":[202],"applications.":[204]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2026-05-01T06:04:38.248271","created_date":"2025-10-10T00:00:00"}
