{"id":"https://openalex.org/W3134406394","doi":"https://doi.org/10.1007/978-3-030-99336-8_1","title":"Categorical Foundations of Gradient-Based Learning","display_name":"Categorical Foundations of Gradient-Based Learning","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W3134406394","doi":"https://doi.org/10.1007/978-3-030-99336-8_1","mag":"3134406394"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-99336-8_1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-99336-8_1","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-030-99336-8_1.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/978-3-030-99336-8_1.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034149967","display_name":"G. S. H. Cruttwell","orcid":"https://orcid.org/0000-0001-8742-6263"},"institutions":[{"id":"https://openalex.org/I163902620","display_name":"Mount Allison University","ror":"https://ror.org/03grc6f14","country_code":"CA","type":"education","lineage":["https://openalex.org/I163902620"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Geoffrey S. H. Cruttwell","raw_affiliation_strings":["Mount Allison University, Sackville, Canada"],"raw_orcid":"https://orcid.org/0000-0001-8742-6263","affiliations":[{"raw_affiliation_string":"Mount Allison University, Sackville, Canada","institution_ids":["https://openalex.org/I163902620"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041889305","display_name":"Bruno Gavranovi\u0107","orcid":"https://orcid.org/0000-0002-6069-5727"},"institutions":[{"id":"https://openalex.org/I181647926","display_name":"University of Strathclyde","ror":"https://ror.org/00n3w3b69","country_code":"GB","type":"education","lineage":["https://openalex.org/I181647926"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Bruno Gavranovi\u0107","raw_affiliation_strings":["University of Strathclyde, Glasgow, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-6069-5727","affiliations":[{"raw_affiliation_string":"University of Strathclyde, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I181647926"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044225957","display_name":"Neil Ghani","orcid":null},"institutions":[{"id":"https://openalex.org/I181647926","display_name":"University of Strathclyde","ror":"https://ror.org/00n3w3b69","country_code":"GB","type":"education","lineage":["https://openalex.org/I181647926"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Neil Ghani","raw_affiliation_strings":["University of Strathclyde, Glasgow, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-3988-2560","affiliations":[{"raw_affiliation_string":"University of Strathclyde, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I181647926"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034202725","display_name":"P. Wilson","orcid":"https://orcid.org/0000-0003-3575-135X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Wilson","raw_affiliation_strings":["University College London, London, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-3575-135X","affiliations":[{"raw_affiliation_string":"University College London, London, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016173850","display_name":"Fabio Zanasi","orcid":"https://orcid.org/0000-0001-6457-1345"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Fabio Zanasi","raw_affiliation_strings":["University College London, London, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0001-6457-1345","affiliations":[{"raw_affiliation_string":"University College London, London, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":27.8602,"has_fulltext":true,"cited_by_count":50,"citation_normalized_percentile":{"value":0.99822891,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12536","display_name":"Topological and Geometric Data Analysis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12536","display_name":"Topological and Geometric Data Analysis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7145311832427979},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.6399303078651428},{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.5899717807769775},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.5146799683570862},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4941571056842804},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4823024272918701},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4752785265445709},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.45321977138519287},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4303521513938904},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4058391749858856},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.30575239658355713},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.27971917390823364},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14286556839942932}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7145311832427979},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.6399303078651428},{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.5899717807769775},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.5146799683570862},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4941571056842804},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4823024272918701},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4752785265445709},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.45321977138519287},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4303521513938904},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4058391749858856},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30575239658355713},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.27971917390823364},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14286556839942932},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/978-3-030-99336-8_1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-99336-8_1","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-030-99336-8_1.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:cris.unibo.it:11585/903819","is_oa":true,"landing_page_url":"https://hdl.handle.net/11585/903819","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10160499","is_oa":false,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10160499/","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"     In:  Programming Languages and Systems. ESOP 2022.  (pp. pp. 1-28).  Springer: Cham, Switzerland. (2022)     ","raw_type":"Proceedings paper"}],"best_oa_location":{"id":"doi:10.1007/978-3-030-99336-8_1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-030-99336-8_1","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-030-99336-8_1.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4854729358","display_name":null,"funder_award_id":"EP/V002376/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3134406394.pdf","grobid_xml":"https://content.openalex.org/works/W3134406394.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W104184427","https://openalex.org/W764651262","https://openalex.org/W1498436455","https://openalex.org/W1585773866","https://openalex.org/W1644475622","https://openalex.org/W1721217740","https://openalex.org/W1902934009","https://openalex.org/W1915485278","https://openalex.org/W1932198206","https://openalex.org/W1968796785","https://openalex.org/W1976985540","https://openalex.org/W1988720110","https://openalex.org/W1998219992","https://openalex.org/W2099471712","https://openalex.org/W2101032471","https://openalex.org/W2112796928","https://openalex.org/W2146502635","https://openalex.org/W2152013675","https://openalex.org/W2160144389","https://openalex.org/W2169393322","https://openalex.org/W2273348943","https://openalex.org/W2293138805","https://openalex.org/W2427497464","https://openalex.org/W2467659428","https://openalex.org/W2478429860","https://openalex.org/W2575704272","https://openalex.org/W2598985404","https://openalex.org/W2604511807","https://openalex.org/W2605287558","https://openalex.org/W2770981215","https://openalex.org/W2796413998","https://openalex.org/W2886174047","https://openalex.org/W2891718318","https://openalex.org/W2903382683","https://openalex.org/W2914196042","https://openalex.org/W2919932891","https://openalex.org/W2949987032","https://openalex.org/W2950993906","https://openalex.org/W2951220338","https://openalex.org/W2951469116","https://openalex.org/W2954487731","https://openalex.org/W2962793481","https://openalex.org/W2963031346","https://openalex.org/W2963989815","https://openalex.org/W2964121744","https://openalex.org/W2964300838","https://openalex.org/W2965268424","https://openalex.org/W2965438805","https://openalex.org/W2980693978","https://openalex.org/W3001712757","https://openalex.org/W3008225017","https://openalex.org/W3023645189","https://openalex.org/W3105507374","https://openalex.org/W3122708264","https://openalex.org/W3160160563","https://openalex.org/W3162302525","https://openalex.org/W3171764958","https://openalex.org/W4214731104","https://openalex.org/W4239510810","https://openalex.org/W4242934920","https://openalex.org/W6628533087","https://openalex.org/W6739886752","https://openalex.org/W6820762428"],"related_works":["https://openalex.org/W3107204728","https://openalex.org/W4287591324","https://openalex.org/W4226420367","https://openalex.org/W2980176872","https://openalex.org/W2962876041","https://openalex.org/W3090555870","https://openalex.org/W3108503355","https://openalex.org/W2249953602","https://openalex.org/W2801655600","https://openalex.org/W2912971006"],"abstract_inverted_index":{"Abstract":[0],"We":[1],"propose":[2],"a":[3,24,32,48],"categorical":[4],"semantics":[5],"of":[6,13,34,50,83,94,103],"gradient-based":[7,70],"machine":[8],"learning":[9,71],"algorithms":[10,37],"in":[11,81,90,109],"terms":[12],"lenses,":[14],"parametric":[15],"maps,":[16],"and":[17,27,42,56,65,86],"reverse":[18],"derivative":[19],"categories.":[20],"This":[21],"foundation":[22],"provides":[23],"powerful":[25],"explanatory":[26],"unifying":[28],"framework:":[29],"it":[30],"encompasses":[31],"variety":[33,49],"gradient":[35],"descent":[36],"such":[38,53],"as":[39,45,47,54],"ADAM,":[40],"AdaGrad,":[41],"Nesterov":[43],"momentum,":[44],"well":[46],"loss":[51],"functions":[52],"MSE":[55],"Softmax":[57],"cross-entropy,":[58],"shedding":[59],"new":[60],"light":[61],"on":[62],"their":[63],"similarities":[64],"differences.":[66],"Our":[67],"approach":[68],"to":[69],"has":[72],"examples":[73],"generalising":[74],"beyond":[75],"the":[76,91,100],"familiar":[77],"continuous":[78],"domains":[79],"(modelled":[80],"categories":[82],"smooth":[84],"maps)":[85],"can":[87],"be":[88],"realized":[89],"discrete":[92],"setting":[93],"boolean":[95],"circuits.":[96],"Finally,":[97],"we":[98],"demonstrate":[99],"practical":[101],"significance":[102],"our":[104],"framework":[105],"with":[106],"an":[107],"implementation":[108],"Python.":[110]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
