{"id":"https://openalex.org/W2910572885","doi":"https://doi.org/10.1109/itw.2018.8613445","title":"Generalization error bounds using Wasserstein distances","display_name":"Generalization error bounds using Wasserstein distances","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2910572885","doi":"https://doi.org/10.1109/itw.2018.8613445","mag":"2910572885"},"language":"en","primary_location":{"id":"doi:10.1109/itw.2018.8613445","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itw.2018.8613445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE Information Theory Workshop (ITW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052441625","display_name":"Adrian Tovar Lopez","orcid":null},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Adrian Tovar Lopez","raw_affiliation_strings":["Department of Mathematics, University of Wisconsin, Madison, WI"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics, University of Wisconsin, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021502006","display_name":"Varun Jog","orcid":"https://orcid.org/0000-0003-4159-0900"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Varun Jog","raw_affiliation_strings":["Department of Electrical Computer Engineering, University of Wisconsin, Madison, WI"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Computer Engineering, University of Wisconsin, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5052441625"],"corresponding_institution_ids":["https://openalex.org/I135310074"],"apc_list":null,"apc_paid":null,"fwci":2.9319,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.9303921,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.8628392815589905},{"id":"https://openalex.org/keywords/lipschitz-continuity","display_name":"Lipschitz continuity","score":0.6727855205535889},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.667234480381012},{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.6546504497528076},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6012522578239441},{"id":"https://openalex.org/keywords/generalization-error","display_name":"Generalization error","score":0.5424999594688416},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.5127347707748413},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.4896305203437805},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.47595998644828796},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4598601162433624},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.4588085412979126},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4477977156639099},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.35999125242233276},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.34241753816604614},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19678309559822083},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.13838127255439758}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.8628392815589905},{"id":"https://openalex.org/C22324862","wikidata":"https://www.wikidata.org/wiki/Q652707","display_name":"Lipschitz continuity","level":2,"score":0.6727855205535889},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.667234480381012},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.6546504497528076},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6012522578239441},{"id":"https://openalex.org/C117765406","wikidata":"https://www.wikidata.org/wiki/Q5362437","display_name":"Generalization error","level":3,"score":0.5424999594688416},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5127347707748413},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.4896305203437805},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.47595998644828796},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4598601162433624},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.4588085412979126},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4477977156639099},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.35999125242233276},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.34241753816604614},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19678309559822083},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.13838127255439758},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/itw.2018.8613445","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itw.2018.8613445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE Information Theory Workshop (ITW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W607505555","https://openalex.org/W1585160083","https://openalex.org/W1811750039","https://openalex.org/W2099111195","https://openalex.org/W2131542408","https://openalex.org/W2141761557","https://openalex.org/W2148603752","https://openalex.org/W2162341153","https://openalex.org/W2167433878","https://openalex.org/W2210387432","https://openalex.org/W2258658829","https://openalex.org/W2541283300","https://openalex.org/W2592651140","https://openalex.org/W2617539226","https://openalex.org/W2736970300","https://openalex.org/W2790390983","https://openalex.org/W2962702650","https://openalex.org/W2963092340","https://openalex.org/W2963650125","https://openalex.org/W2963794891","https://openalex.org/W2963862692","https://openalex.org/W2964106499","https://openalex.org/W3005141333","https://openalex.org/W3112350859","https://openalex.org/W4236362309","https://openalex.org/W4285719527","https://openalex.org/W4293583552","https://openalex.org/W4293774175","https://openalex.org/W6635108014","https://openalex.org/W6638214083","https://openalex.org/W6679563152","https://openalex.org/W6684809622","https://openalex.org/W6692563690","https://openalex.org/W6734280532","https://openalex.org/W6738074204","https://openalex.org/W6741472820","https://openalex.org/W6748601875","https://openalex.org/W6751754507","https://openalex.org/W6786708663","https://openalex.org/W7034108470"],"related_works":["https://openalex.org/W2947416323","https://openalex.org/W4288346661","https://openalex.org/W4206903459","https://openalex.org/W2754816816","https://openalex.org/W4366280654","https://openalex.org/W3160167280","https://openalex.org/W4231621013","https://openalex.org/W4362706668","https://openalex.org/W3008318776","https://openalex.org/W1977633006"],"abstract_inverted_index":{"Generalization":[0],"error":[1,31,62],"of":[2,49,65,73,80],"a":[3,66,81],"learning":[4,98],"algorithm":[5],"characterizes":[6],"the":[7,37,42,46,60,71,78],"gap":[8],"between":[9,41],"an":[10,50],"algorithm's":[11],"performance":[12,17],"on":[13,18,59],"test":[14],"data":[15],"versus":[16],"training":[19],"data.":[20],"In":[21,52],"recent":[22],"work,":[23],"Xu":[24],"&":[25],"Raginsky":[26],"[1]":[27],"showed":[28],"that":[29,111],"generalization":[30,61],"may":[32],"be":[33],"upper-":[34],"bounded":[35],"using":[36],"mutual":[38,87,121],"information":[39],"I(S;W)":[40],"input":[43],"S":[44,74],"and":[45,75],"output":[47],"W":[48,76],"algorithm.":[51],"this":[53],"paper,":[54],"we":[55,109],"derive":[56],"upper":[57],"bounds":[58,92,117],"in":[63,112],"terms":[64],"certain":[67],"Wasserstein":[68],"distance":[69],"involving":[70],"distributions":[72],"under":[77],"assumption":[79],"Lipschitz":[82],"continuous":[83],"loss":[84],"function.":[85],"Unlike":[86],"information-based":[88,122],"bounds,":[89],"these":[90,116],"new":[91],"are":[93,118],"useful":[94],"even":[95],"for":[96,101],"deterministic":[97],"algorithms,":[99],"or":[100],"algorithms":[102],"such":[103],"as":[104],"stochastic":[105],"gradient":[106],"descent.":[107],"Moreover,":[108],"show":[110],"some":[113],"natural":[114],"cases":[115],"tighter":[119],"than":[120],"bounds.":[123]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
