{"id":"https://openalex.org/W3043494131","doi":"https://doi.org/10.5220/0009823200780089","title":"On Generating Efficient Data Summaries for Logistic Regression: A Coreset-based Approach","display_name":"On Generating Efficient Data Summaries for Logistic Regression: A Coreset-based Approach","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3043494131","doi":"https://doi.org/10.5220/0009823200780089","mag":"3043494131"},"language":"en","primary_location":{"id":"doi:10.5220/0009823200780089","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0009823200780089","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Data Science, Technology and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0009823200780089","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085913592","display_name":"Nery Riquelme-Granada","orcid":null},"institutions":[{"id":"https://openalex.org/I184558857","display_name":"Royal Holloway University of London","ror":"https://ror.org/04g2vpn86","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I184558857"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Nery Riquelme-Granada","raw_affiliation_strings":["Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---","institution_ids":["https://openalex.org/I184558857"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034957171","display_name":"Khuong An Nguyen","orcid":"https://orcid.org/0000-0001-6198-9295"},"institutions":[{"id":"https://openalex.org/I184558857","display_name":"Royal Holloway University of London","ror":"https://ror.org/04g2vpn86","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I184558857"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Khuong Nguyen","raw_affiliation_strings":["Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---","institution_ids":["https://openalex.org/I184558857"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070080426","display_name":"Zhiyuan Luo","orcid":"https://orcid.org/0000-0002-3336-3751"},"institutions":[{"id":"https://openalex.org/I184558857","display_name":"Royal Holloway University of London","ror":"https://ror.org/04g2vpn86","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I184558857"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhiyuan Luo","raw_affiliation_strings":["Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Royal Holloway University of London, Egham, Surrey, TW20 0EX, U.K., --- Select a Country ---","institution_ids":["https://openalex.org/I184558857"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5085913592"],"corresponding_institution_ids":["https://openalex.org/I184558857"],"apc_list":null,"apc_paid":null,"fwci":0.2669,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.63749923,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"78","last_page":"89"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9118000268936157,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7285172939300537},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.7117996215820312},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.26292020082473755}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7285172939300537},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.7117996215820312},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26292020082473755}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0009823200780089","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0009823200780089","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Data Science, Technology and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire/1d3bc81f-6263-4fe0-a2fa-8e6c705fdc8b","is_oa":false,"landing_page_url":"https://research.brighton.ac.uk/en/publications/1d3bc81f-6263-4fe0-a2fa-8e6c705fdc8b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401758","display_name":"University of Brighton Repository (University of Brighton)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I71637028","host_organization_name":"University of Brighton","host_organization_lineage":["https://openalex.org/I71637028"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Riquelme-Granada, N, Nguyen, K A & Luo, Z 2020, On generating efficient data summaries for logistic regression: A coreset-based approach. in S Hammoudi, C Quix & J Bernardino (eds), DATA 2020 - Proceedings of the 9th International Conference on Data Science, Technology and Applications. vol. 1, DATA 2020 - Proceedings of the 9th International Conference on Data Science, Technology and Applications, pp. 78-89, 9th International Conference on Data Science, Technology and Applications (DATA 2020), France, 6/07/20. https://doi.org/10.5220/0009823200780089","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"doi:10.5220/0009823200780089","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0009823200780089","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Data Science, Technology and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W607505555","https://openalex.org/W1584308190","https://openalex.org/W1981773323","https://openalex.org/W2045964207","https://openalex.org/W2073459066","https://openalex.org/W2229238337","https://openalex.org/W2404724429","https://openalex.org/W2589206893","https://openalex.org/W2612467436","https://openalex.org/W2616148604","https://openalex.org/W2805004751","https://openalex.org/W4292022450","https://openalex.org/W4294635342"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880","https://openalex.org/W1596801655"],"abstract_inverted_index":{"In":[0],"the":[1,23,44,76,89,108,116,126,135,149],"era":[2],"of":[3,5,22,33,37,91,152],"datasets":[4],"unprecedented":[6],"sizes,":[7],"data":[8,38],"compression":[9,30],"techniques":[10],"are":[11,98],"an":[12],"attractive":[13],"approach":[14],"for":[15,27,78,87,93],"speeding":[16],"up":[17],"machine":[18],"learning":[19,59,65,111,123],"algorithms.":[20],"One":[21],"most":[24],"successful":[25],"paradigms":[26],"achieving":[28],"good-quality":[29],"is":[31,75],"that":[32,39,73,142],"coresets:":[34],"small":[35],"summaries":[36],"act":[40],"as":[41],"proxies":[42],"to":[43,52,56,63],"original":[45],"input":[46,128],"data.":[47],"Even":[48],"though":[49],"coresets":[50,92,97],"proved":[51],"be":[53],"extremely":[54],"useful":[55],"accelerate":[57],"unsupervised":[58],"problems,":[60],"applying":[61],"them":[62],"supervised":[64],"problems":[66],"may":[67],"bring":[68],"unexpected":[69],"computational":[70],"bottlenecks.<br/><br/>We":[71],"show":[72],"this":[74,94],"case":[77],"Logistic":[79],"Regression":[80],"classification,":[81],"and":[82,110,130],"hence":[83],"propose":[84],"two":[85],"methods":[86,102],"accelerating":[88,144],"computation":[90],"problem.":[95],"When":[96],"computed":[99],"using":[100],"our":[101,139,143],"on":[103],"three":[104],"public":[105],"datasets,":[106],"computing":[107],"coreset":[109],"from":[112,125],"it":[113],"is,":[114],"in":[115,134],"worst":[117],"case,":[118],"11":[119],"times":[120,132],"faster":[121,133],"than":[122],"directly":[124],"full":[127],"data,":[129],"34":[131],"best":[136],"case.":[137],"Furthermore,":[138],"results":[140],"indicate":[141],"approaches":[145],"do":[146],"not":[147],"degrade":[148],"empirical":[150],"performance":[151],"coresets.":[153]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
