{"id":"https://openalex.org/W2257410811","doi":"https://doi.org/10.1145/3365672","title":"A New Smooth Approximation to the Zero One Loss with a Probabilistic Interpretation","display_name":"A New Smooth Approximation to the Zero One Loss with a Probabilistic Interpretation","publication_year":2019,"publication_date":"2019-12-13","ids":{"openalex":"https://openalex.org/W2257410811","doi":"https://doi.org/10.1145/3365672","mag":"2257410811"},"language":"en","primary_location":{"id":"doi:10.1145/3365672","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3365672","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1511.05643","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027084430","display_name":"K. M. Azharul Hasan","orcid":"https://orcid.org/0000-0003-1228-9043"},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Md Kamrul Hasan","raw_affiliation_strings":["\u00c9cole Polytechnique Montr\u00e9al, QC, Canada","Ecole Polytechnique de Montr\u00e9al,"],"affiliations":[{"raw_affiliation_string":"\u00c9cole Polytechnique Montr\u00e9al, QC, Canada","institution_ids":["https://openalex.org/I45683168"]},{"raw_affiliation_string":"Ecole Polytechnique de Montr\u00e9al,","institution_ids":["https://openalex.org/I45683168"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075885606","display_name":"Christopher Pal","orcid":"https://orcid.org/0000-0001-6534-2114"},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Christopher Pal","raw_affiliation_strings":["Mila, \u00c9cole Polytechnique Montr\u00e9al, QC, Canada","Ecole Polytechnique de Montr\u00e9al,"],"affiliations":[{"raw_affiliation_string":"Mila, \u00c9cole Polytechnique Montr\u00e9al, QC, Canada","institution_ids":["https://openalex.org/I45683168"]},{"raw_affiliation_string":"Ecole Polytechnique de Montr\u00e9al,","institution_ids":["https://openalex.org/I45683168"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5027084430"],"corresponding_institution_ids":["https://openalex.org/I45683168"],"apc_list":null,"apc_paid":null,"fwci":0.1447,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54431934,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":"14","issue":"1","first_page":"1","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hinge-loss","display_name":"Hinge loss","score":0.7754244804382324},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5239356160163879},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5023114681243896},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5009975433349609},{"id":"https://openalex.org/keywords/maxima-and-minima","display_name":"Maxima and minima","score":0.4703117907047272},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44150179624557495},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4286990761756897},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.41803693771362305},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.39810773730278015},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39646559953689575},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33450114727020264},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.324238121509552}],"concepts":[{"id":"https://openalex.org/C39891107","wikidata":"https://www.wikidata.org/wiki/Q5767098","display_name":"Hinge loss","level":3,"score":0.7754244804382324},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5239356160163879},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5023114681243896},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5009975433349609},{"id":"https://openalex.org/C186633575","wikidata":"https://www.wikidata.org/wiki/Q845060","display_name":"Maxima and minima","level":2,"score":0.4703117907047272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44150179624557495},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4286990761756897},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.41803693771362305},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.39810773730278015},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39646559953689575},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33450114727020264},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.324238121509552},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1145/3365672","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3365672","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1511.05643","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1511.05643","pdf_url":"https://arxiv.org/pdf/1511.05643","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2257410811","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1511.05643","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:publications.polymtl.ca:44438","is_oa":false,"landing_page_url":"https://publications.polymtl.ca/44438/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401013","display_name":"PolyPublie (\u00c9cole Polytechnique de Montr\u00e9al)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45683168","host_organization_name":"Polytechnique Montr\u00e9al","host_organization_lineage":["https://openalex.org/I45683168"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article de revue"},{"id":"doi:10.48550/arxiv.1511.05643","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1511.05643","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1511.05643","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1511.05643","pdf_url":"https://arxiv.org/pdf/1511.05643","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2257410811.pdf","grobid_xml":"https://content.openalex.org/works/W2257410811.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W232191560","https://openalex.org/W1514928307","https://openalex.org/W1524688041","https://openalex.org/W1605479404","https://openalex.org/W1661786820","https://openalex.org/W1663973292","https://openalex.org/W1989494851","https://openalex.org/W1994720006","https://openalex.org/W2014374971","https://openalex.org/W2030843733","https://openalex.org/W2038663599","https://openalex.org/W2068221105","https://openalex.org/W2068696370","https://openalex.org/W2089394015","https://openalex.org/W2091364465","https://openalex.org/W2104193541","https://openalex.org/W2122537498","https://openalex.org/W2122825543","https://openalex.org/W2129809168","https://openalex.org/W2134507744","https://openalex.org/W2134829400","https://openalex.org/W2146666958","https://openalex.org/W2156909104","https://openalex.org/W2158460069","https://openalex.org/W2162152253","https://openalex.org/W2163608767","https://openalex.org/W2166765763","https://openalex.org/W2189481455","https://openalex.org/W2469023256","https://openalex.org/W2534029181","https://openalex.org/W2602025658","https://openalex.org/W2757686304","https://openalex.org/W2761674588","https://openalex.org/W3003518101","https://openalex.org/W3120740533","https://openalex.org/W4240374930","https://openalex.org/W6675672614"],"related_works":["https://openalex.org/W3004679435","https://openalex.org/W2110187108","https://openalex.org/W2273716988","https://openalex.org/W2092939062","https://openalex.org/W2921234600","https://openalex.org/W3035571418","https://openalex.org/W3163232994","https://openalex.org/W2184512081","https://openalex.org/W1763059553","https://openalex.org/W2152089394","https://openalex.org/W3041621985","https://openalex.org/W1633572439","https://openalex.org/W3203684173","https://openalex.org/W2373439703","https://openalex.org/W2107190016","https://openalex.org/W2587801071","https://openalex.org/W2618410756","https://openalex.org/W3123750365","https://openalex.org/W2124022122","https://openalex.org/W245192467"],"abstract_inverted_index":{"We":[0,83,174],"examine":[1],"a":[2,19,37,45,57,61,98,132,150,169,235],"new":[3],"form":[4],"of":[5,21,36,63,97,100,153,219],"smooth":[6],"approximation":[7],"to":[8,44,71,112,141,164,185,188],"the":[9,22,33,51,177,189,216],"zero":[10,52],"one":[11,53],"loss":[12,147],"in":[13,86],"which":[14,87],"learning":[15,126],"is":[16,29,68,123,179],"performed":[17],"using":[18,32,92,106,131],"reformulation":[20],"widely":[23,142],"used":[24,143],"logistic":[25,47,73,144,190,197],"function.":[26],"Our":[27,117,135],"approach":[28,67,178,241],"based":[30],"on":[31,149,202,214],"posterior":[34],"mean":[35],"novel":[38],"generalized":[39,46,70],"Beta-Bernoulli":[40],"formulation.":[41],"This":[42],"leads":[43],"function":[48],"that":[49,120,176],"approximates":[50],"loss,":[54],"but":[55],"retains":[56],"probabilistic":[58,236],"formulation":[59,221],"conferring":[60],"number":[62],"useful":[64],"properties.":[65],"The":[66],"easily":[69,76],"kernel":[72],"regression":[74],"and":[75,103,145,160,168,191,198,230,249],"integrated":[77,233],"into":[78,234],"methods":[79,148],"for":[80],"structured":[81,237],"prediction.":[82],"present":[84],"experiments":[85,118,136],"we":[88],"learn":[89],"such":[90],"models":[91,201],"an":[93],"optimization":[94,121],"method":[95],"consisting":[96],"combination":[99],"gradient":[101],"descent":[102,105],"coordinate":[104],"localized":[107],"grid":[108],"search":[109],"so":[110],"as":[111,180],"escape":[113],"from":[114,156],"local":[115],"minima.":[116],"indicate":[119],"quality":[122],"improved":[124,138,247],"when":[125,208,232],"metaparameters":[127],"are":[128],"themselves":[129],"optimized":[130],"validation":[133],"set.":[134],"show":[137],"performance":[139],"relative":[140],"hinge":[146,192],"wide":[151],"variety":[152],"problems":[154],"ranging":[155],"standard":[157],"UC":[158],"Irvine":[159],"libSVM":[161],"evaluation":[162],"datasets":[163],"product":[165],"review":[166],"predictions":[167],"visual":[170],"information":[171,251],"extraction":[172,252],"task.":[173],"observe":[175],"follows:":[181],"(1)":[182],"more":[183,243],"robust":[184],"outliers":[186],"compared":[187],"losses;":[193],"(2)":[194],"outperforms":[195],"comparable":[196],"max":[199],"margin":[200],"larger":[203],"scale":[204],"benchmark":[205],"problems;":[206],"(3)":[207],"combined":[209],"with":[210],"Gaussian\u2013Laplacian":[211],"mixture":[212],"prior":[213],"parameters":[215],"kernelized":[217],"version":[218],"our":[220,240],"yields":[222],"sparser":[223],"solutions":[224],"than":[225],"Support":[226],"Vector":[227],"Machine":[228],"classifiers;":[229],"(4)":[231],"prediction":[238],"technique":[239],"provides":[242],"accurate":[244],"probabilities":[245],"yielding":[246],"inference":[248],"increasing":[250],"performance.":[253]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
